{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 准备，导入对应模块"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 317,
   "metadata": {},
   "outputs": [],
   "source": [
    "import base64\n",
    "import json\n",
    "import pprint\n",
    "import random\n",
    "import re\n",
    "import time\n",
    "\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import requests\n",
    "from lxml.html import fromstring\n",
    "from PIL import Image\n",
    "from requests_html import HTMLSession\n",
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.by import By\n",
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 260,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Launch the Chrome session that the rest of the notebook drives through `driver`.\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # works around the \"DevToolsActivePort file doesn't exist\" startup error\n",
    "opts.add_argument('--window-size=1920,3000')  # Chrome's --window-size takes WIDTH,HEIGHT (comma-separated)\n",
    "opts.add_argument('--disable-gpu')  # Google's docs mention adding this switch to avoid a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, for a few special pages\n",
    "\n",
    "# Optional settings, left disabled:\n",
    "# opts.add_argument('blink-settings=imagesEnabled=false')  # do not load images, for speed\n",
    "# opts.add_argument('--headless')  # no visible browser window; needed on Linux hosts without a display\n",
    "# opts.binary_location = '/path/to/chrome'  # browser binary to launch (not the chromedriver executable)\n",
    "# caps = dict(); caps[\"pageLoadStrategy\"] = \"none\"  # do not wait for full page load (pass desired_capabilities=caps)\n",
    "\n",
    "# `options=` is the supported keyword; `chrome_options=` raises a DeprecationWarning.\n",
    "driver = webdriver.Chrome(options=opts)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 进入知网"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 262,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the CNKI landing page in the browser session.\n",
    "CNKI_HOME_URL = \"https://www.cnki.net/\"\n",
    "driver.get(CNKI_HOME_URL)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 检查是否是 “中山大学南方学院”登录"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 264,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "''"
      ]
     },
     "execution_count": 264,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the inner HTML of the element with id 'Ecp_loginShowName1'.\n",
    "# NOTE(review): an empty string presumably means no institutional login was detected - confirm.\n",
    "# `find_element(By.ID, ...)` replaces `find_element_by_id`, which Selenium 4.3+ no longer provides.\n",
    "driver.find_element(By.ID, 'Ecp_loginShowName1').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 高级检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 266,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the advanced-search entry (element id 'highSearch').\n",
    "# click() returns None, so its result is not stored in a variable.\n",
    "driver.find_element(By.ID, 'highSearch').click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 窗口检查"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 268,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'CDwindow-629082E3B45570093EBFC0633EC53B94'"
      ]
     },
     "execution_count": 268,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the handle of the window the driver is currently attached to.\n",
    "driver.current_window_handle"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 所有窗口"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 270,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-629082E3B45570093EBFC0633EC53B94',\n",
       " 'CDwindow-3C3BD51F846E1D8E34ABBE5D4B52E434']"
      ]
     },
     "execution_count": 270,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# List the handles of every window/tab open in this browser session.\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 窗口切换"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 272,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Move driver focus to the second window handle (index 1).\n",
    "# `switch_to.window` is the supported replacement for the deprecated `switch_to_window`.\n",
    "driver.switch_to.window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 选项筛选"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 275,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Set the search filters. click() returns None, so the results are not stored.\n",
    "# Academic journals\n",
    "driver.find_element(By.XPATH, '//li[@data-id=\"xsqk\"]').click()\n",
    "# Click professional search\n",
    "driver.find_element(By.NAME, 'majorSearch').click()\n",
    "# Source category: all\n",
    "driver.find_element(By.XPATH, '//input[@name=\"all\"]').click()\n",
    "# Untick the Chinese/English extension option\n",
    "driver.find_element(By.XPATH, '//input[@data-id=\"EN\"]').click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 进行检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 276,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Search expression to submit\n",
    "query = 'SU = \"计算机\" AND  (TI =\"gis\" OR  TI =\"python\"  OR TI = \"AI\" OR TI = \"big data\")'\n",
    "# Type the expression into the page's textarea, clearing any previous content first\n",
    "element = driver.find_element(By.XPATH, '//textarea')\n",
    "element.clear()\n",
    "element.send_keys(query)\n",
    "# Click the search button (the input whose value attribute is \"检索\");\n",
    "# click() returns None, so its result is not stored.\n",
    "driver.find_element(By.XPATH, '//input[@value=\"检索\"]').click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 检索结果"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 278,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'共找到<em>10,235</em>条结果'"
      ]
     },
     "execution_count": 278,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the result-count banner: the inner HTML of the span with class \"pagerTitleCell\".\n",
    "# The value is raw HTML (the number is wrapped in <em>), not a parsed integer.\n",
    "element = driver.find_element(By.XPATH, '//span[@class=\"pagerTitleCell\"]')\n",
    "文章数量 = element.get_attribute('innerHTML')\n",
    "文章数量"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 单击显示框"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 280,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the <i> element with class \"icon icon-sort\".\n",
    "# NOTE(review): presumably this opens the results-per-page dropdown - confirm against the page.\n",
    "element = driver.find_element(By.XPATH, '//i[@class=\"icon icon-sort\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 选择显示50篇"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 282,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the link for the data-val=\"50\" entry inside the #perPageDiv list (50 results per page).\n",
    "element = driver.find_element(By.XPATH, '//div[@id=\"perPageDiv\"]//li[@data-val=\"50\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 表格第一页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 284,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>基于计算机的大数据和云计算技术探析</td>\n",
       "      <td>马珺杰</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>大数据背景下的人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>王婧; 张学娜</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>大数据时代计算机网络安全防范分析</td>\n",
       "      <td>楚丙奇</td>\n",
       "      <td>办公自动化</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究</td>\n",
       "      <td>赵于卓; 黄子莹</td>\n",
       "      <td>中国商论</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>GIS专业自然地理学野外实习的教学改革实践</td>\n",
       "      <td>吴小芳; 钟晓兰; 谢刚生; 何正勇</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于GIS的入侵生物适生区预测——以桔小实蝇为例</td>\n",
       "      <td>张华纬; 赵健; 李志鹏</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-06-24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>GIS技术在地理空间教学实践中的应用</td>\n",
       "      <td>马炎池</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>新工科视域下计算机科学与技术专业大数据方向培养体系探索</td>\n",
       "      <td>李金忠</td>\n",
       "      <td>台州学院学报</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>17.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>基于RS和GIS技术的西藏多龙矿集区矿山选址研究</td>\n",
       "      <td>赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥</td>\n",
       "      <td>国土资源遥感</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>大数据时代信息伦理的困境与应对研究</td>\n",
       "      <td>梁宇; 郑易平</td>\n",
       "      <td>科学技术哲学研究</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>542.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发</td>\n",
       "      <td>罗海涛</td>\n",
       "      <td>铁道勘察</td>\n",
       "      <td>2021-06-02 17:41</td>\n",
       "      <td>NaN</td>\n",
       "      <td>339.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>安富利携手合作伙伴共同展示AI创新技术及应用</td>\n",
       "      <td>NaN</td>\n",
       "      <td>单片机与嵌入式系统应用</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>基于计算机的大数据和云计算技术分析</td>\n",
       "      <td>秦蓉</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据背景下的开放教育计算机专业教育改革研究</td>\n",
       "      <td>段超</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析</td>\n",
       "      <td>吴娟</td>\n",
       "      <td>山西农经</td>\n",
       "      <td>2021-05-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>基于计算思维的“Python程序设计”课程教学研究</td>\n",
       "      <td>罗平娟; 彭芳策</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>地理信息系统课程实践教学中改进方法的探究</td>\n",
       "      <td>赵天明</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于GIS的徐州市火灾应急救援系统设计与实现</td>\n",
       "      <td>仲旸; 李保杰; 笪柳炎</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>237.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例</td>\n",
       "      <td>谭磊; 贺美德; 柳飞</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>206.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于大数据的设备分析系统研究</td>\n",
       "      <td>王学松; 刘天才</td>\n",
       "      <td>自动化与仪器仪表</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>基于Python的图书馆信息管理系统研发</td>\n",
       "      <td>胡小春; 田婧; 陈燕</td>\n",
       "      <td>信息技术与信息化</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>159.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>计算机软件技术在大数据时代的应用分析</td>\n",
       "      <td>鄢冲</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>14.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>大数据时代下计算机软件技术的应用分析</td>\n",
       "      <td>陈建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>大数据背景下计算机信息技术在网络安全中的运用探析</td>\n",
       "      <td>格桑次仁</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下高职计算机应用技术移动学习的研究</td>\n",
       "      <td>赵建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>大数据时代下计算机软件技术的应用</td>\n",
       "      <td>李永刚</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据环境在“计算机组装与维护”课程教学改革研究中的应用</td>\n",
       "      <td>程光璇; 刘慧</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据与计算机网络的信息安全策略分析</td>\n",
       "      <td>李培培</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>423.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>大数据时代计算机科学与技术专业改造升级路径探索</td>\n",
       "      <td>赵建华; 刘宁</td>\n",
       "      <td>微型电脑应用</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>182.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究</td>\n",
       "      <td>贺宁; 邹晓华; 唐丽萍</td>\n",
       "      <td>江苏科技信息</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>50.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>大数据背景下地方高校人工智能方向人才培养模式探索</td>\n",
       "      <td>叶青; 刘长华</td>\n",
       "      <td>湖北工程学院学报</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>GIS技术在农村饮水安全工程评价系统中的应用</td>\n",
       "      <td>房凯</td>\n",
       "      <td>农业工程</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>基于Python Flask的运维信息管理系统设计与实现</td>\n",
       "      <td>冷四军</td>\n",
       "      <td>电脑编程技巧与维护</td>\n",
       "      <td>2021-05-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>135.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>面向大数据信息时代计算机科学的应用探析</td>\n",
       "      <td>彭雪</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>111.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>基于大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李晓霞</td>\n",
       "      <td>电子测试</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>浅谈GIS对于开展地理教学的影响</td>\n",
       "      <td>王莉; 阿里木江·卡斯木</td>\n",
       "      <td>科学咨询(教育科研)</td>\n",
       "      <td>2021-05-14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>153.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据在粮库信息化中的应用</td>\n",
       "      <td>刘廷凤; 吴建军</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究</td>\n",
       "      <td>陈艳; 吴珍珍</td>\n",
       "      <td>河北农机</td>\n",
       "      <td>2021-05-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>AIPerf：大规模人工智能算力基准测试程序</td>\n",
       "      <td>翟季冬</td>\n",
       "      <td>大数据</td>\n",
       "      <td>2021-05-06 16:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>69.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>基于stm32系统与物联网的AI多功能门禁系统研究</td>\n",
       "      <td>林佳智;常凤筠;朱文斌;朱瑞昕;张天赐</td>\n",
       "      <td>科学技术创新</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>236.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>大数据时代下人工智能在计算机网络技术中的运用探讨</td>\n",
       "      <td>杨文学</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>大数据驱动的计算机网络远程教学质量评价研究</td>\n",
       "      <td>云洁; 白雪</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>149.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于GIS的城市地下管线信息管理系统研究与实现</td>\n",
       "      <td>孙凯;王青</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>基于Python Flask的温度数据可视化</td>\n",
       "      <td>胡钊</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>大数据在地理信息系统中的应用探索</td>\n",
       "      <td>黄相维</td>\n",
       "      <td>黑龙江水利科技</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>地理信息系统GIS在城市测绘中的应用研究</td>\n",
       "      <td>肖玉勇</td>\n",
       "      <td>智能城市</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>309.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>大数据时代网络信息安全及对应策略研究</td>\n",
       "      <td>集世璞</td>\n",
       "      <td>中小企业管理与科技(下旬刊)</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>405.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>基于大数据的计算机专业学生就业方向研究</td>\n",
       "      <td>陈欣; 江悦</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>GIS与语言学交叉研究</td>\n",
       "      <td>韦韧</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>103.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价</td>\n",
       "      <td>周玲美; 王世航; 权玲</td>\n",
       "      <td>生态与农村环境学报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                            基于计算机的大数据和云计算技术探析   \n",
       "1            2                    大数据背景下的人工智能在计算机网络技术中的应用研究   \n",
       "2            3                             大数据时代计算机网络安全防范分析   \n",
       "3            4                 基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究   \n",
       "4            5                        GIS专业自然地理学野外实习的教学改革实践   \n",
       "5            6                     基于GIS的入侵生物适生区预测——以桔小实蝇为例   \n",
       "6            7                           GIS技术在地理空间教学实践中的应用   \n",
       "7            8                  新工科视域下计算机科学与技术专业大数据方向培养体系探索   \n",
       "8            9                     基于RS和GIS技术的西藏多龙矿集区矿山选址研究   \n",
       "9           10                            大数据时代信息伦理的困境与应对研究   \n",
       "10          11            基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发   \n",
       "11          12                       安富利携手合作伙伴共同展示AI创新技术及应用   \n",
       "12          13                            基于计算机的大数据和云计算技术分析   \n",
       "13          14                       大数据背景下的开放教育计算机专业教育改革研究   \n",
       "14          15                     基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析   \n",
       "15          16                    基于计算思维的“Python程序设计”课程教学研究   \n",
       "16          17                         地理信息系统课程实践教学中改进方法的探究   \n",
       "17          18                       基于GIS的徐州市火灾应急救援系统设计与实现   \n",
       "18          19   GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例   \n",
       "19          20                               基于大数据的设备分析系统研究   \n",
       "20          21                         基于Python的图书馆信息管理系统研发   \n",
       "21          22                           计算机软件技术在大数据时代的应用分析   \n",
       "22          23                           大数据时代下计算机软件技术的应用分析   \n",
       "23          24                     大数据背景下计算机信息技术在网络安全中的运用探析   \n",
       "24          25                       大数据背景下高职计算机应用技术移动学习的研究   \n",
       "25          26                             大数据时代下计算机软件技术的应用   \n",
       "26          27                 大数据环境在“计算机组装与维护”课程教学改革研究中的应用   \n",
       "27          28                           大数据与计算机网络的信息安全策略分析   \n",
       "28          29                      大数据时代计算机科学与技术专业改造升级路径探索   \n",
       "29          30               工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究   \n",
       "30          31                     大数据背景下地方高校人工智能方向人才培养模式探索   \n",
       "31          32                       GIS技术在农村饮水安全工程评价系统中的应用   \n",
       "32          33                 基于Python Flask的运维信息管理系统设计与实现   \n",
       "33          34                          面向大数据信息时代计算机科学的应用探析   \n",
       "34          35                      基于大数据时代人工智能在计算机网络技术中的应用   \n",
       "35          36                             浅谈GIS对于开展地理教学的影响   \n",
       "36          37                                大数据在粮库信息化中的应用   \n",
       "37          38  《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究   \n",
       "38          39                       AIPerf：大规模人工智能算力基准测试程序   \n",
       "39          40                    基于stm32系统与物联网的AI多功能门禁系统研究   \n",
       "40          41                     大数据时代下人工智能在计算机网络技术中的运用探讨   \n",
       "41          42                        大数据驱动的计算机网络远程教学质量评价研究   \n",
       "42          43                      基于GIS的城市地下管线信息管理系统研究与实现   \n",
       "43          44                       基于Python Flask的温度数据可视化   \n",
       "44          45                             大数据在地理信息系统中的应用探索   \n",
       "45          46                         地理信息系统GIS在城市测绘中的应用研究   \n",
       "46          47                           大数据时代网络信息安全及对应策略研究   \n",
       "47          48                          基于大数据的计算机专业学生就业方向研究   \n",
       "48          49                                  GIS与语言学交叉研究   \n",
       "49          50               基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价   \n",
       "\n",
       "                     作者              刊名              发表时间  被引     下载  操作  \n",
       "0                   马珺杰  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载  \n",
       "1               王婧; 张学娜  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载  \n",
       "2                   楚丙奇           办公自动化        2021-07-01 NaN    NaN  下载  \n",
       "3              赵于卓; 黄子莹            中国商论        2021-06-30 NaN    NaN  下载  \n",
       "4    吴小芳; 钟晓兰; 谢刚生; 何正勇            测绘通报        2021-06-25 NaN   49.0  下载  \n",
       "5          张华纬; 赵健; 李志鹏       测绘与空间地理信息        2021-06-24 NaN   64.0  下载  \n",
       "6                   马炎池            电子技术        2021-06-20 NaN  152.0  下载  \n",
       "7                   李金忠          台州学院学报        2021-06-20 NaN   17.0  下载  \n",
       "8    赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥          国土资源遥感        2021-06-15 NaN    9.0  下载  \n",
       "9               梁宇; 郑易平        科学技术哲学研究        2021-06-05 NaN  542.0  下载  \n",
       "10                  罗海涛            铁道勘察  2021-06-02 17:41 NaN  339.0  下载  \n",
       "11                  NaN     单片机与嵌入式系统应用        2021-06-01 NaN    NaN  下载  \n",
       "12                   秦蓉          数字通信世界        2021-06-01 NaN    NaN  下载  \n",
       "13                   段超          数字通信世界        2021-06-01 NaN    NaN  下载  \n",
       "14                   吴娟            山西农经        2021-05-30 NaN   19.0  下载  \n",
       "15             罗平娟; 彭芳策         电脑知识与技术        2021-05-25 NaN   71.0  下载  \n",
       "16                  赵天明       测绘与空间地理信息        2021-05-25 NaN   80.0  下载  \n",
       "17         仲旸; 李保杰; 笪柳炎       测绘与空间地理信息        2021-05-25 NaN  237.0  下载  \n",
       "18          谭磊; 贺美德; 柳飞       测绘与空间地理信息        2021-05-25 NaN  206.0  下载  \n",
       "19             王学松; 刘天才        自动化与仪器仪表        2021-05-25 NaN   24.0  下载  \n",
       "20          胡小春; 田婧; 陈燕        信息技术与信息化        2021-05-25 NaN  159.0  下载  \n",
       "21                   鄢冲         数字技术与应用        2021-05-25 NaN   14.0  下载  \n",
       "22                  陈建伟         数字技术与应用        2021-05-25 NaN    8.0  下载  \n",
       "23                 格桑次仁         数字技术与应用        2021-05-25 NaN   11.0  下载  \n",
       "24                  赵建伟         数字技术与应用        2021-05-25 NaN    3.0  下载  \n",
       "25                  李永刚          无线互联科技        2021-05-25 NaN    NaN  下载  \n",
       "26              程光璇; 刘慧          无线互联科技        2021-05-25 NaN    NaN  下载  \n",
       "27                  李培培            电子技术        2021-05-20 NaN  423.0  下载  \n",
       "28              赵建华; 刘宁          微型电脑应用        2021-05-20 NaN  182.0  下载  \n",
       "29         贺宁; 邹晓华; 唐丽萍          江苏科技信息        2021-05-20 NaN   50.0  下载  \n",
       "30              叶青; 刘长华        湖北工程学院学报        2021-05-20 NaN   61.0  下载  \n",
       "31                   房凯            农业工程        2021-05-20 NaN    1.0  下载  \n",
       "32                  冷四军       电脑编程技巧与维护        2021-05-18 NaN  135.0  下载  \n",
       "33                   彭雪  中小企业管理与科技(中旬刊)        2021-05-15 NaN  111.0  下载  \n",
       "34                  李晓霞            电子测试        2021-05-15 NaN   53.0  下载  \n",
       "35         王莉; 阿里木江·卡斯木      科学咨询(教育科研)        2021-05-14 NaN  153.0  下载  \n",
       "36             刘廷凤; 吴建军          现代电子技术        2021-05-12 NaN  152.0  下载  \n",
       "37              陈艳; 吴珍珍            河北农机        2021-05-10 NaN   33.0  下载  \n",
       "38                  翟季冬             大数据  2021-05-06 16:32 NaN   69.0  下载  \n",
       "39  林佳智;常凤筠;朱文斌;朱瑞昕;张天赐          科学技术创新        2021-05-05 NaN  236.0  下载  \n",
       "40                  杨文学         电脑知识与技术        2021-05-05 NaN   38.0  下载  \n",
       "41               云洁; 白雪          现代电子技术        2021-05-01 NaN  149.0  下载  \n",
       "42                孙凯;王青          数字通信世界        2021-05-01 NaN   32.0  下载  \n",
       "43                   胡钊            电子世界        2021-04-30 NaN  274.0  下载  \n",
       "44                  黄相维         黑龙江水利科技        2021-04-30 NaN  123.0  下载  \n",
       "45                  肖玉勇            智能城市        2021-04-28 NaN  309.0  下载  \n",
       "46                  集世璞  中小企业管理与科技(下旬刊)        2021-04-25 NaN  405.0  下载  \n",
       "47               陈欣; 江悦         电脑知识与技术        2021-04-25 NaN  119.0  下载  \n",
       "48                   韦韧            测绘通报        2021-04-25 NaN  103.0  下载  \n",
       "49         周玲美; 王世航; 权玲       生态与农村环境学报        2021-04-25 NaN  274.0  下载  "
      ]
     },
     "execution_count": 284,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "element=driver.find_element_by_id('gridTable')\n",
    "第一页页面信息_HTML=element.get_attribute('innerHTML')\n",
    "第一页页面信息_HTML\n",
    "df_第一页页面表格=pd.read_html(第一页页面信息_HTML)[0]\n",
    "df_第一页页面表格"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 285,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 获取详细页的链接并与基本信息表格合并"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 286,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 获取详详情页链接\n",
    "html = driver.page_source\n",
    "root = fromstring(html)\n",
    "href = [x for x in root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')]\n",
    "\n",
    "def correct(href):\n",
    "    DbCode = re.findall(\"DbCode=(.*?)&\",href)[0]\n",
    "    dbname = re.findall(\"dbname=(.*?)&\",href)[0]\n",
    "    filename = re.findall(\"filename=(.*?)&\",href)[0]\n",
    "    href = f\"https://kns.cnki.net/kcms/detail/detail.aspx?dbcode={DbCode}&dbname={dbname}&filename={filename}\"\n",
    "    return href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 287,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详情页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>基于计算机的大数据和云计算技术探析</td>\n",
       "      <td>马珺杰</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>大数据背景下的人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>王婧; 张学娜</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>大数据时代计算机网络安全防范分析</td>\n",
       "      <td>楚丙奇</td>\n",
       "      <td>办公自动化</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究</td>\n",
       "      <td>赵于卓; 黄子莹</td>\n",
       "      <td>中国商论</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>GIS专业自然地理学野外实习的教学改革实践</td>\n",
       "      <td>吴小芳; 钟晓兰; 谢刚生; 何正勇</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于GIS的入侵生物适生区预测——以桔小实蝇为例</td>\n",
       "      <td>张华纬; 赵健; 李志鹏</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-06-24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>GIS技术在地理空间教学实践中的应用</td>\n",
       "      <td>马炎池</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>新工科视域下计算机科学与技术专业大数据方向培养体系探索</td>\n",
       "      <td>李金忠</td>\n",
       "      <td>台州学院学报</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>17.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>基于RS和GIS技术的西藏多龙矿集区矿山选址研究</td>\n",
       "      <td>赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥</td>\n",
       "      <td>国土资源遥感</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>大数据时代信息伦理的困境与应对研究</td>\n",
       "      <td>梁宇; 郑易平</td>\n",
       "      <td>科学技术哲学研究</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>542.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发</td>\n",
       "      <td>罗海涛</td>\n",
       "      <td>铁道勘察</td>\n",
       "      <td>2021-06-02 17:41</td>\n",
       "      <td>NaN</td>\n",
       "      <td>339.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>安富利携手合作伙伴共同展示AI创新技术及应用</td>\n",
       "      <td>NaN</td>\n",
       "      <td>单片机与嵌入式系统应用</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>基于计算机的大数据和云计算技术分析</td>\n",
       "      <td>秦蓉</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据背景下的开放教育计算机专业教育改革研究</td>\n",
       "      <td>段超</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析</td>\n",
       "      <td>吴娟</td>\n",
       "      <td>山西农经</td>\n",
       "      <td>2021-05-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>基于计算思维的“Python程序设计”课程教学研究</td>\n",
       "      <td>罗平娟; 彭芳策</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>地理信息系统课程实践教学中改进方法的探究</td>\n",
       "      <td>赵天明</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于GIS的徐州市火灾应急救援系统设计与实现</td>\n",
       "      <td>仲旸; 李保杰; 笪柳炎</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>237.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例</td>\n",
       "      <td>谭磊; 贺美德; 柳飞</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>206.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于大数据的设备分析系统研究</td>\n",
       "      <td>王学松; 刘天才</td>\n",
       "      <td>自动化与仪器仪表</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>基于Python的图书馆信息管理系统研发</td>\n",
       "      <td>胡小春; 田婧; 陈燕</td>\n",
       "      <td>信息技术与信息化</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>159.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>计算机软件技术在大数据时代的应用分析</td>\n",
       "      <td>鄢冲</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>14.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>大数据时代下计算机软件技术的应用分析</td>\n",
       "      <td>陈建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>大数据背景下计算机信息技术在网络安全中的运用探析</td>\n",
       "      <td>格桑次仁</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下高职计算机应用技术移动学习的研究</td>\n",
       "      <td>赵建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>大数据时代下计算机软件技术的应用</td>\n",
       "      <td>李永刚</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据环境在“计算机组装与维护”课程教学改革研究中的应用</td>\n",
       "      <td>程光璇; 刘慧</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据与计算机网络的信息安全策略分析</td>\n",
       "      <td>李培培</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>423.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>大数据时代计算机科学与技术专业改造升级路径探索</td>\n",
       "      <td>赵建华; 刘宁</td>\n",
       "      <td>微型电脑应用</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>182.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究</td>\n",
       "      <td>贺宁; 邹晓华; 唐丽萍</td>\n",
       "      <td>江苏科技信息</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>50.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>大数据背景下地方高校人工智能方向人才培养模式探索</td>\n",
       "      <td>叶青; 刘长华</td>\n",
       "      <td>湖北工程学院学报</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>GIS技术在农村饮水安全工程评价系统中的应用</td>\n",
       "      <td>房凯</td>\n",
       "      <td>农业工程</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>基于Python Flask的运维信息管理系统设计与实现</td>\n",
       "      <td>冷四军</td>\n",
       "      <td>电脑编程技巧与维护</td>\n",
       "      <td>2021-05-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>135.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>面向大数据信息时代计算机科学的应用探析</td>\n",
       "      <td>彭雪</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>111.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>基于大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李晓霞</td>\n",
       "      <td>电子测试</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>浅谈GIS对于开展地理教学的影响</td>\n",
       "      <td>王莉; 阿里木江·卡斯木</td>\n",
       "      <td>科学咨询(教育科研)</td>\n",
       "      <td>2021-05-14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>153.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据在粮库信息化中的应用</td>\n",
       "      <td>刘廷凤; 吴建军</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究</td>\n",
       "      <td>陈艳; 吴珍珍</td>\n",
       "      <td>河北农机</td>\n",
       "      <td>2021-05-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>AIPerf：大规模人工智能算力基准测试程序</td>\n",
       "      <td>翟季冬</td>\n",
       "      <td>大数据</td>\n",
       "      <td>2021-05-06 16:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>69.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>基于stm32系统与物联网的AI多功能门禁系统研究</td>\n",
       "      <td>林佳智;常凤筠;朱文斌;朱瑞昕;张天赐</td>\n",
       "      <td>科学技术创新</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>236.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>大数据时代下人工智能在计算机网络技术中的运用探讨</td>\n",
       "      <td>杨文学</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>大数据驱动的计算机网络远程教学质量评价研究</td>\n",
       "      <td>云洁; 白雪</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>149.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于GIS的城市地下管线信息管理系统研究与实现</td>\n",
       "      <td>孙凯;王青</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>基于Python Flask的温度数据可视化</td>\n",
       "      <td>胡钊</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>大数据在地理信息系统中的应用探索</td>\n",
       "      <td>黄相维</td>\n",
       "      <td>黑龙江水利科技</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>地理信息系统GIS在城市测绘中的应用研究</td>\n",
       "      <td>肖玉勇</td>\n",
       "      <td>智能城市</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>309.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>大数据时代网络信息安全及对应策略研究</td>\n",
       "      <td>集世璞</td>\n",
       "      <td>中小企业管理与科技(下旬刊)</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>405.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>基于大数据的计算机专业学生就业方向研究</td>\n",
       "      <td>陈欣; 江悦</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>GIS与语言学交叉研究</td>\n",
       "      <td>韦韧</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>103.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价</td>\n",
       "      <td>周玲美; 王世航; 权玲</td>\n",
       "      <td>生态与农村环境学报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                            基于计算机的大数据和云计算技术探析   \n",
       "1            2                    大数据背景下的人工智能在计算机网络技术中的应用研究   \n",
       "2            3                             大数据时代计算机网络安全防范分析   \n",
       "3            4                 基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究   \n",
       "4            5                        GIS专业自然地理学野外实习的教学改革实践   \n",
       "5            6                     基于GIS的入侵生物适生区预测——以桔小实蝇为例   \n",
       "6            7                           GIS技术在地理空间教学实践中的应用   \n",
       "7            8                  新工科视域下计算机科学与技术专业大数据方向培养体系探索   \n",
       "8            9                     基于RS和GIS技术的西藏多龙矿集区矿山选址研究   \n",
       "9           10                            大数据时代信息伦理的困境与应对研究   \n",
       "10          11            基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发   \n",
       "11          12                       安富利携手合作伙伴共同展示AI创新技术及应用   \n",
       "12          13                            基于计算机的大数据和云计算技术分析   \n",
       "13          14                       大数据背景下的开放教育计算机专业教育改革研究   \n",
       "14          15                     基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析   \n",
       "15          16                    基于计算思维的“Python程序设计”课程教学研究   \n",
       "16          17                         地理信息系统课程实践教学中改进方法的探究   \n",
       "17          18                       基于GIS的徐州市火灾应急救援系统设计与实现   \n",
       "18          19   GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例   \n",
       "19          20                               基于大数据的设备分析系统研究   \n",
       "20          21                         基于Python的图书馆信息管理系统研发   \n",
       "21          22                           计算机软件技术在大数据时代的应用分析   \n",
       "22          23                           大数据时代下计算机软件技术的应用分析   \n",
       "23          24                     大数据背景下计算机信息技术在网络安全中的运用探析   \n",
       "24          25                       大数据背景下高职计算机应用技术移动学习的研究   \n",
       "25          26                             大数据时代下计算机软件技术的应用   \n",
       "26          27                 大数据环境在“计算机组装与维护”课程教学改革研究中的应用   \n",
       "27          28                           大数据与计算机网络的信息安全策略分析   \n",
       "28          29                      大数据时代计算机科学与技术专业改造升级路径探索   \n",
       "29          30               工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究   \n",
       "30          31                     大数据背景下地方高校人工智能方向人才培养模式探索   \n",
       "31          32                       GIS技术在农村饮水安全工程评价系统中的应用   \n",
       "32          33                 基于Python Flask的运维信息管理系统设计与实现   \n",
       "33          34                          面向大数据信息时代计算机科学的应用探析   \n",
       "34          35                      基于大数据时代人工智能在计算机网络技术中的应用   \n",
       "35          36                             浅谈GIS对于开展地理教学的影响   \n",
       "36          37                                大数据在粮库信息化中的应用   \n",
       "37          38  《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究   \n",
       "38          39                       AIPerf：大规模人工智能算力基准测试程序   \n",
       "39          40                    基于stm32系统与物联网的AI多功能门禁系统研究   \n",
       "40          41                     大数据时代下人工智能在计算机网络技术中的运用探讨   \n",
       "41          42                        大数据驱动的计算机网络远程教学质量评价研究   \n",
       "42          43                      基于GIS的城市地下管线信息管理系统研究与实现   \n",
       "43          44                       基于Python Flask的温度数据可视化   \n",
       "44          45                             大数据在地理信息系统中的应用探索   \n",
       "45          46                         地理信息系统GIS在城市测绘中的应用研究   \n",
       "46          47                           大数据时代网络信息安全及对应策略研究   \n",
       "47          48                          基于大数据的计算机专业学生就业方向研究   \n",
       "48          49                                  GIS与语言学交叉研究   \n",
       "49          50               基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价   \n",
       "\n",
       "                     作者              刊名              发表时间  被引     下载  操作  \\\n",
       "0                   马珺杰  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载   \n",
       "1               王婧; 张学娜  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载   \n",
       "2                   楚丙奇           办公自动化        2021-07-01 NaN    NaN  下载   \n",
       "3              赵于卓; 黄子莹            中国商论        2021-06-30 NaN    NaN  下载   \n",
       "4    吴小芳; 钟晓兰; 谢刚生; 何正勇            测绘通报        2021-06-25 NaN   49.0  下载   \n",
       "5          张华纬; 赵健; 李志鹏       测绘与空间地理信息        2021-06-24 NaN   64.0  下载   \n",
       "6                   马炎池            电子技术        2021-06-20 NaN  152.0  下载   \n",
       "7                   李金忠          台州学院学报        2021-06-20 NaN   17.0  下载   \n",
       "8    赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥          国土资源遥感        2021-06-15 NaN    9.0  下载   \n",
       "9               梁宇; 郑易平        科学技术哲学研究        2021-06-05 NaN  542.0  下载   \n",
       "10                  罗海涛            铁道勘察  2021-06-02 17:41 NaN  339.0  下载   \n",
       "11                  NaN     单片机与嵌入式系统应用        2021-06-01 NaN    NaN  下载   \n",
       "12                   秦蓉          数字通信世界        2021-06-01 NaN    NaN  下载   \n",
       "13                   段超          数字通信世界        2021-06-01 NaN    NaN  下载   \n",
       "14                   吴娟            山西农经        2021-05-30 NaN   19.0  下载   \n",
       "15             罗平娟; 彭芳策         电脑知识与技术        2021-05-25 NaN   71.0  下载   \n",
       "16                  赵天明       测绘与空间地理信息        2021-05-25 NaN   80.0  下载   \n",
       "17         仲旸; 李保杰; 笪柳炎       测绘与空间地理信息        2021-05-25 NaN  237.0  下载   \n",
       "18          谭磊; 贺美德; 柳飞       测绘与空间地理信息        2021-05-25 NaN  206.0  下载   \n",
       "19             王学松; 刘天才        自动化与仪器仪表        2021-05-25 NaN   24.0  下载   \n",
       "20          胡小春; 田婧; 陈燕        信息技术与信息化        2021-05-25 NaN  159.0  下载   \n",
       "21                   鄢冲         数字技术与应用        2021-05-25 NaN   14.0  下载   \n",
       "22                  陈建伟         数字技术与应用        2021-05-25 NaN    8.0  下载   \n",
       "23                 格桑次仁         数字技术与应用        2021-05-25 NaN   11.0  下载   \n",
       "24                  赵建伟         数字技术与应用        2021-05-25 NaN    3.0  下载   \n",
       "25                  李永刚          无线互联科技        2021-05-25 NaN    NaN  下载   \n",
       "26              程光璇; 刘慧          无线互联科技        2021-05-25 NaN    NaN  下载   \n",
       "27                  李培培            电子技术        2021-05-20 NaN  423.0  下载   \n",
       "28              赵建华; 刘宁          微型电脑应用        2021-05-20 NaN  182.0  下载   \n",
       "29         贺宁; 邹晓华; 唐丽萍          江苏科技信息        2021-05-20 NaN   50.0  下载   \n",
       "30              叶青; 刘长华        湖北工程学院学报        2021-05-20 NaN   61.0  下载   \n",
       "31                   房凯            农业工程        2021-05-20 NaN    1.0  下载   \n",
       "32                  冷四军       电脑编程技巧与维护        2021-05-18 NaN  135.0  下载   \n",
       "33                   彭雪  中小企业管理与科技(中旬刊)        2021-05-15 NaN  111.0  下载   \n",
       "34                  李晓霞            电子测试        2021-05-15 NaN   53.0  下载   \n",
       "35         王莉; 阿里木江·卡斯木      科学咨询(教育科研)        2021-05-14 NaN  153.0  下载   \n",
       "36             刘廷凤; 吴建军          现代电子技术        2021-05-12 NaN  152.0  下载   \n",
       "37              陈艳; 吴珍珍            河北农机        2021-05-10 NaN   33.0  下载   \n",
       "38                  翟季冬             大数据  2021-05-06 16:32 NaN   69.0  下载   \n",
       "39  林佳智;常凤筠;朱文斌;朱瑞昕;张天赐          科学技术创新        2021-05-05 NaN  236.0  下载   \n",
       "40                  杨文学         电脑知识与技术        2021-05-05 NaN   38.0  下载   \n",
       "41               云洁; 白雪          现代电子技术        2021-05-01 NaN  149.0  下载   \n",
       "42                孙凯;王青          数字通信世界        2021-05-01 NaN   32.0  下载   \n",
       "43                   胡钊            电子世界        2021-04-30 NaN  274.0  下载   \n",
       "44                  黄相维         黑龙江水利科技        2021-04-30 NaN  123.0  下载   \n",
       "45                  肖玉勇            智能城市        2021-04-28 NaN  309.0  下载   \n",
       "46                  集世璞  中小企业管理与科技(下旬刊)        2021-04-25 NaN  405.0  下载   \n",
       "47               陈欣; 江悦         电脑知识与技术        2021-04-25 NaN  119.0  下载   \n",
       "48                   韦韧            测绘通报        2021-04-25 NaN  103.0  下载   \n",
       "49         周玲美; 王世航; 权玲       生态与农村环境学报        2021-04-25 NaN  274.0  下载   \n",
       "\n",
       "                                                详情页链接  \n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...  "
      ]
     },
     "execution_count": 287,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "links=[]\n",
    "\n",
    "for link in href:\n",
    "    link=correct(link)\n",
    "    links.append(link)\n",
    "    df_links=pd.DataFrame({'详情页链接':links})\n",
    "    df_首页=pd.concat([pd.read_html(第一页页面信息_HTML)[0],df_links],axis=1)\n",
    "\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 288,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 获取详细页面中的PDF下载链接"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 289,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['/kcms/download.aspx?filename=mR4oGORl3K0YTS5YmMKVzatRDbtN3bZB3RylGWjlmY1okZI9CW3EDWrE2Uz0WbYJHeJNmYqJmRvF1Q=0DNQ5ERpNEeWJ1KQ52VoF3NwhUYMV1L5oWSHRlUWhUT55mWFlmQ2IXOsVjNvZTZFF1LslTZxwEdpd&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=UVmpGSP52TPl0MCNWSUBXdzUVaux0M28UZwIldUxmbWJ0dNlzUxc3QSNnS2IXTHVXUxR1blhWanhXU=0TS3lmTGpVUXZnWOlVQvkGe5d2cNl2UTJXblZ3Khl3d2FTQ2hDay8iUzo3btVVYB9kNit0UFxEW21&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=UVmpGSP52TPl0MCNWSUBXdzUVaux0M28UZwIldUxmbWJ0dNlzUxc3QSNnS2IXTHVXUxR1blhWanhXU=0zbJl1bCVDUlZmcGtyQMR1a3IXbjZDOnplclZ3Khl3d2FTQ2hDay8iUzo3btVVYB9kNit0UFxEW21&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=neMtGOtxUZxwUbNdDMZJTVLRFc5U1KGBjVPtkNnN1YrBjUX9WY18SSMJzTZRmU1syZSVEaGJ0TKlGV=0TWk9kRxYEVWlFW5k3SkRWd1Y0Nj9yQ0NnSIN0Q4NWZidWTvBTTLBjeD50aFFkaOFVeVFkdXRWVmZ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=HZmRjTiBlTGF1YHNDMKZzRllmU4AjbIRWTvklUQhXZys0ZHN0UTlzNGJzbQdUQwkGRD9mWnNFdkt0V=0zZLhTdyADUFtWVwQESoVWbTtWV3ImcMZlbLV2LThld1J2Qih1QLRndOlFZ1BlZ15keYh0NSJEZDp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TSvEEVWhzcxpHc0c3StVnSDJlNZR0VNlHTLpkVSd0VQRVdIB3VWJFU2JWV1l0a4lVQlh2UHRWWGVnW=0TR5cka0RjWu1WW5MWSyMFbitEZ6N1K3AndFNnQIVVSyIEUMpWe5N1T3MlZxRmY3ZnQZ1UU0QEdQR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TSvEEVWhzcxpHc0c3StVnSDJlNZR0VNlHTLpkVSd0VQRVdIB3VWJFU2JWV1l0a4lVQlh2UHRWWGVnW=0DNxcUZZhzRGR1RvhlSytCU2YUVyIDSxBndFNnQIVVSyIEUMpWe5N1T3MlZxRmY3ZnQZ1UU0QEdQR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=lQThUNH5WN58CbKhFN2okcFRleBJDSlJFbsV0KuBzcsdzTLtERVRzQ4pETNBVONJWYwM1SoZXTaZGZ=0TQv50Yz92ayVTSWhVdlZDZ4UndaNGUFVVdltyUTZHSxkEcw0URUFkb6JWeHdDast0UwJWWZZTRmp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=0VW9maClGOvp1SRxUaOdUaGhETXBHMCZjNQtUewolTwI0RuBVbml1cpZjYrlmRz8GZsRERJ9kcCh0Z=0zcRpkbkJXbvoEaxIHVr4GT0Y0NGZEVyQGV3UWYUNDN4JTR2YlVxMkdiR3dGNDVE1me5h0VUVVYqd&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=qd0VW9maClGOvp1SRxUaOdUaGhETXBHMCZjNQtUewolTwI0RuBVbml1cpZjYrlmRz8GZsRERJ9kcCh0Zj52b6F1Vj5GTz92aHl0Mzl1VKdDTEJkdzxUeORVcrZTU0NXRyJGMphGbxMkdiR3dGNDVE1me5h0VUVVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FhjT4JzatNmajNUdW9ENih3RBJEO510R4cHeq1EROBnUntyVENXaz9WRENlWXZmbvAzV24mdhp1VWNnaxRGUSJGTS12ZhxUN5x2SRlXQJRXc3RnVqB3TodjN0VVWIVlR4gUYndVTBVWO2V2U3plaZh2VMJUWQhHb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FeKh1cYNzYQ5URWFXcwNmarsGVys2RSx0NHNkZaRjNz1EMwJnaLpERE5mco5WY4BlSVllbCJ3SxNWb=0TRW10caFkSvdlT0YkVxlGRZpmaTRDWYJDeaBzMttUTXlWa6RVbmVWYwhHWk1UShdnNuJ2Tih3UyZ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FU5NmQiNEN1w0QSZEWz0mSEFDdENlav52NVpkUrFnVwhnYsVWTsFlWMp0K25kYu90QCp0ZjtEcTVUc=0zZjpkZIF3RQRmUVlEOGVTVZFmTNRUYLd2Ui1mZ09icWZWQBVzdspGcNh1LOF1LSd0QWtGO3kGRul&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FU5NmQiNEN1w0QSZEWz0mSEFDdENlav52NVpkUrFnVwhnYsVWTsFlWMp0K25kYu90QCp0ZjtEcTVUc=0DMClDajJHSQRmUVlEOGVTVZFmTNRUYLd2Ui1mZ09icWZWQBVzdspGcNh1LOF1LSd0QWtGO3kGRul&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ElVV182SxQWNyUWNEZzM4hkVWNVQCVVbVl2SWFDTshWV5UGSBJnYURHTtlVN6RkQ380MIRXUENWVtBHdEJWQl9EawFFVUpHRJdGUZd3NOBzU5gWcSpndvh2KVh3QOVXUvATbmdnN4R1NVdnRM5EV0BlcXVTV0V2R&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=idVQmtketNUZLVGc1cGaL5WZmx0auh3bDV2KBFTTxMTV0JGOQtSS2FUYvR2NGpGWuFXWwVmSk5mQPp1dltiQrAFSzEVSzEjYnd3aDJmT2MUN4UHcrEWdVpHZaZlQx82MqRlUMJUSRRHMolFNzIGSTJ2NzQnbiNWd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=idVQmtketNUZLVGc1cGaL5WZmx0auh3bDV2KBFTTxMTV0JGOQtSS2FUYvR2NGpGWuFXWwVmSk5mQPp1dqp0RycGSykUYTpWdk9mZwFVVY9SW0NHdlV0aJZVVSJHezdnTxFkQrYzNURHMolFNzIGSTJ2NzQnbiNWd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=sd3QQRXUWNnSEtkR1Z0RYljN08mSWhFTlRUNzhUWIBzMEd1VDt2MWhWdYBnb3J1RxJVRrAlQFdkbpNkeI5Wca9EVZ9iWN9EUwZGRvJTS1B3aV1kUlBVWMhnYwUTUHJkUO5WUw82M1RXMI1WZkZzL4ZHT2lGO0EHd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=sd3QQRXUWNnSEtkR1Z0RYljN08mSWhFTlRUNzhUWIBzMEd1VDt2MWhWdYBnb3J1RxJVRrAlQFdkbpNkeZZmdXBFVZ9iWN9EUwZGRvJTS1B3aV1kUlBVWMhnYwUTUHJkUO5WUw82M1RXMI1WZkZzL4ZHT2lGO0EHd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ZZlM5x0K2lnVDZHa4oFTshjd240YS9Eb35mSxxEdOZlSSlVWiREM2A1cHJ0ZXlETuFVU2JUdml1UL1GRudjN44kMPFFTVFkMKRGMhR2TalzQ4EFdZJEO2Jkb1pVYBRXNpVzQYlTS3FmcUF3ROhTWjZjeBpkbvgFc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=GaTlWQOZHezEEUV9ib5YkQttUOkdGTMV2Z2dURMhjWSdzMNh2dpVnWGpEchhVMqdFMCtWbHpWemd1R=0zdoRnYFV2Vxh2ZKhGZ5h1MKNUcNpnRRhjMzh0dUdmVzlmS4RGZkNVb0R2NNZXN4QHevkjU5Ukc2E&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DZUxEaJ9Wd4JkbCB1YT9CZMt0bxl0L21EarxUQ2o3Z3UVRCtGezQFT5pHOq10bQ9UNzpWSChnYYdHV=0zaz4WYwkVU540dPxGZhZ1TEZna5M0YaZncBR0MzFUaOdVW5w0N6BFW4EmcFZGSkJGa1U2bpRENml&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DZUxEaJ9Wd4JkbCB1YT9CZMt0bxl0L21EarxUQ2o3Z3UVRCtGezQFT5pHOq10bQ9UNzpWSChnYYdHV=0za5xUNxkVU540dPxGZhZ1TEZna5M0YaZncBR0MzFUaOdVW5w0N6BFW4EmcFZGSkJGa1U2bpRENml&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TTzVzNsBzKTt0ZNNzLntWSYdlZ0kDSldXSQZlUDJ3Z3x0LLp1MxgTYvtCWC1mcJVUdHVlQiF1Ryd2V=0TQTRFb4JUcyAFaxRjWvVnUuFlVZFnUyJkVORjWQ9yYmNHdhtyQIdFdDJETrYUd5YVO6JlRaVFS0k&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TTzVzNsBzKTt0ZNNzLntWSYdlZ0kDSldXSQZlUDJ3Z3x0LLp1MxgTYvtCWC1mcJVUdHVlQiF1Ryd2V=0DNqhTe4JUcyAFaxRjWvVnUuFlVZFnUyJkVORjWQ9yYmNHdhtyQIdFdDJETrYUd5YVO6JlRaVFS0k&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=VMZdGdyZUMPtie4wWeK9EcJl3ZwU1VuZVcvYTVxcXUQdnWaNjTxtEUNd1KKhVM3cXShBHZkRnWvRHZ=0TWMBlZ39kNJdFOphVZXNHVOFGdJRUYwBDT4kGTEtieOJDURh0T2hkcK12brFUMrRVSn1kNuZ3S1o&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=VMZdGdyZUMPtie4wWeK9EcJl3ZwU1VuZVcvYTVxcXUQdnWaNjTxtEUNd1KKhVM3cXShBHZkRnWvRHZ=0zYihke49kNJdFOphVZXNHVOFGdJRUYwBDT4kGTEtieOJDURh0T2hkcK12brFUMrRVSn1kNuZ3S1o&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ztkZolEdPNjZv9GUaJ2VTFWYJRzKuFFOzMleiNTcBdjaPdDTXhESzpUTJxWY4JETkV3NzF2VExURRV2ZDFjYtRnSRticyYUMu90MGh3by5ENxEnWspkc3Vnb4kke4lDSyJmSZhjTqZnY2oUc2p2V50GVthmWrtWe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=NJ0bZNGTZtiSWFHU5NlQER0M3lXdyw2R4wUVlZFN5tSYOFnQtRndGJVa3FFerIjYrQDexdHS49GWNJnboVmenlGNaR2R5oXcRhDNxhkRVtGSwAnWIdlNvEzVzg2SyQzdhlGaUZmQOl0UxkVUyZXY3ZHeygGRpVlS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=NJ0bZNGTZtiSWFHU5NlQER0M3lXdyw2R4wUVlZFN5tSYOFnQtRndGJVa3FFerIjYrQDexdHS49GWNJnboR3K082LmdEd5dWZ4IzRrFXWV9CWCp0dPJGR2RmUUNWYo5mcWtSbQx2SOl0UxkVUyZXY3ZHeygGRpVlS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2gGd0gmUK52S5JmM15GW4xUe4dkdLhlMKZ0UkRmNHFkUxoHaGRFahNHTaBVW4IjNmFURydmeZh0QnJWcHNjQN1URT1kSMZFOvolZnJkZzwGR5VnaulVRJ5WSQZ3K6tmRD90Sz00TqJXenh0Y390Vvo1NPVnMkhDc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=0MNhWQBlmRkNkeZplMUx2L5BnYR5UN4RzTFR2LSVUbHRTOjFkeyY0Ka90UohGZK5mUkp1c5NFaKxEd=0TQrg1TaJVSmBFNpJXVL9WOw0WdqJkNhJmaWpGRwsWbrNjZwgEazIUdLdGakNFdBF3K3JEcDZFcyE&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=QFUZhZ2YUhGaINFd5B3MpZVQlhUMnZGeZR1cPFzZ55EZTZmZ4FTbxVjVDpkTrMlWyR0ait0aatmVk92dYVnTmVDehF0KrVWZR5URKdkQzk2d0NVTZVTTUh2btZnaMp1Vw40VZpFcNplTG5kV3IXRLd3ZJZFc4EVS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DN3SZBnWyJHbxcHV3gkZwAlWYJ0S1hUY1ZWc0hkVRFTNzAHdrNHM1g3ULhkbl1GUnN2RIZmVhZlZapEROhlRGRDM4kFT4hHaZFnSRJVMEV1a5sGcDplQFd3K18WVLl3TwMUYJ12cxlzT1UzdBdUavQWcPR2dQhVe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DN3SZBnWyJHbxcHV3gkZwAlWYJ0S1hUY1ZWc0hkVRFTNzAHdrNHM1g3ULhkbl1GUnN2RIZmVhZlZapERxUFWrkXdYNVVa9yanFUTuhHOUR1aktSSBZXY1ZEeiJUOuFmR1kzR5cnNxlzT1UzdBdUavQWcPR2dQhVe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RB1S6Fna5M0MzMEdVR1QahEN48WRq5WRnxUQLFzMu5UcwtWbYdXVyZzTQp2NyIldwYzKpFlTCdGT0x2RLN0YKRjVklVRpNmWrA1TPtES2M1Q2dja090UVl1M6NUUUNkYpx2QVRWTv9mQLlWRqZzbnNzcOhTSntSR&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RB1S6Fna5M0MzMEdVR1QahEN48WRq5WRnxUQLFzMu5UcwtWbYdXVyZzTQp2NyIldwYzKpFlTCdGT0x2R3RWTEBXe5RWeTFXd5NVTmtGeRVUUKd3bnxEWipnZvUXdkpXSEF2UPB1Vv9mQLlWRqZzbnNzcOhTSntSR&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=WN0RP10dXJGV3BjZBVnS4ImRLVHM4BHV0MGU3QnRvlWVa1kVKJHZmd2Vx5kM18We6ZzTHJUejlXeXZ1SQ9UYZFnZtllQKFzTidlcC1EVSZTWyIWMrp1YvIjMPxmcJxkQSlVZTRjUINWR0olZBlUdklUb5FHWr4Ue&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=WN0RP10dXJGV3BjZBVnS4ImRLVHM4BHV0MGU3QnRvlWVa1kVKJHZmd2Vx5kM18We6ZzTHJUejlXeXZ1SKZ1bvY0SLZFbodDNTxUQChlSKBDMPRTZvZHN3ElSthlNrUDWlpGR2gXWINWR0olZBlUdklUb5FHWr4Ue&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RJUez10UiFTS3VXUZBVMGFTZtRGVpZ3dtZ0RBFFSuR3c3I0LYJWaJJWcQJkdhBXYSlEazxWc2JFZxdkTFBFNxdENoFVbOZEWjtmVLF2aCxEaxEFOCNGMQp2V6d0cn1GT4lTSzEFZVdXbz9UVrZUe4IWRpRnV2gER&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1M3KMl1K4VVclZnSW9EURlXYkREMKpkbHFlZTtENMJVZ6dGSqFjQXN1dpNldzMHMNZDSIdlaWNWSTlWUNFTb28EN2cXaUhTYShlRGhzMQNFN6FHRyJzVM9yS1RTYQVWb5EnenRVNENUMVNlZ0o3crYzaD1WVlVEa&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1M3KMl1K4VVclZnSW9EURlXYkREMKpkbHFlZTtENMJVZ6dGSqFjQXN1dpNldzMHMNZDSIdlaWNWSTlWU04WO08UZ3V0QGVGWwFmWLR2L05EaLtibEF1UKl2S1RTYQVWb5EnenRVNENUMVNlZ0o3crYzaD1WVlVEa&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=iNzd1YGbxcmRrgESYVHTlBlROJ0ZMV3bydFcEx2bMZ0NGd0NsZVO0gGSuFjQZpkZ350Q3gkY3V3btRFV0MVd1pHTjFHN0YGNmBnRZVkbSZldhd2RK92NJl1SaV0awQ0aD9ERsJzcN5UQhRVe2ZHS3EWR4VEbzdEO&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=3YjcrFnR3xWNChFTyY1b5A1Mu1mV0EkQ5YVSTZEayx0c0RGOux0VGV1LKhUWadHUYFnWZNXVY5kYPREWjtyQahjbBl2dvFzK050KRJmWkVmdRFnZCVDSUllVP9mYGxmYthHaNdTYJNXW2EXU4UEVEREURN0U0IHc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=3YjcrFnR3xWNChFTyY1b5A1Mu1mV0EkQ5YVSTZEayx0c0RGOux0VGV1LKhUWadHUYFnWZNXVY5kYPREWxl0ZstSUyljb210Nat2N6JXTpZ0UXFUQ1QjQxlTSnBzUKhFea5WQxAnQJNXW2EXU4UEVEREURN0U0IHc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=nBXYzImVzRVQ2MzUSVDTQ9yZF9SOvsyaYVVWkVUWDl3VBJXa6h2Y2kjUhBDM0QHdKJGcuNWT5h1RpZWYVh3UOt2Nk5mYZdURFhWcOBXZXZFaNdzM5hDNUNXTU92N5d3aN50M1MmQxIkUrN1QXxUT55GS2l0SJ90d&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=nBXYzImVzRVQ2MzUSVDTQ9yZF9SOvsyaYVVWkVUWDl3VBJXa6h2Y2kjUhBDM0QHdKJGcuNWT5h1RpZWYvxUVYdTR69mQPlTd2UGctdmQhR0QZRkTYtSZLtWWCZUVjNkMvYWYQd1RxIkUrN1QXxUT55GS2l0SJ90d&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=KdUQ1NFNUBnZl1mYoBXc3gmQIF0bBlGVi12cy9yMIdVYwklYxNHeTpHMZ1WTZFVNPRXVkZlRZFXbMFFZuNWdIJzV3QmazU1LMZDbNRjVIFDO2o1S0MjSyJ1cN1We2wkVKh2cqtEWiF2SFhkSFVjUw5GW4s0d5x0R&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=JpFazZmcyUVZiZlMBtyaQ5USxZnQ1UWYNRXVOJkTVJXToZEeJ9Wb0gnY6Vncn50bM9mcwcEe6lkWmJ0ZaJzTO9URvUmbmhld0YWZXhUZEdHeXh0UXZ3RSp1QTZ0Lkt2RjdEb1c1R28yd0sGOyJ0KSZDemNTWoVDe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=JpFazZmcyUVZiZlMBtyaQ5USxZnQ1UWYNRXVOJkTVJXToZEeJ9Wb0gnY6Vncn50bM9mcwcEe6lkWmJ0ZwQVQWpGOodkcwckSD1ER5c2TzZkSOR1TYJFbyJ3YwtWR5JHTjdEb1c1R28yd0sGOyJ0KSZDemNTWoVDe&tablename=CJFDLAST2021&dflag=pdfdown']"
      ]
     },
     "execution_count": 289,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 获取详细页面中的PDF下载链接\n",
    "from requests_html import HTMLSession\n",
    "import urllib.parse\n",
    "\n",
    "session = HTMLSession()\n",
    "\n",
    "pdf_links=[]\n",
    "\n",
    "for url in links:\n",
    "    r = session.get(url)\n",
    "    pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "    pdf_links.append(pdf_link_xpath)\n",
    "\n",
    "pdf_links"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 290,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['https://kns.cnki.net/kcms/download.aspx?filename=mR4oGORl3K0YTS5YmMKVzatRDbtN3bZB3RylGWjlmY1okZI9CW3EDWrE2Uz0WbYJHeJNmYqJmRvF1Q=0DNQ5ERpNEeWJ1KQ52VoF3NwhUYMV1L5oWSHRlUWhUT55mWFlmQ2IXOsVjNvZTZFF1LslTZxwEdpd&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=UVmpGSP52TPl0MCNWSUBXdzUVaux0M28UZwIldUxmbWJ0dNlzUxc3QSNnS2IXTHVXUxR1blhWanhXU=0TS3lmTGpVUXZnWOlVQvkGe5d2cNl2UTJXblZ3Khl3d2FTQ2hDay8iUzo3btVVYB9kNit0UFxEW21&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=UVmpGSP52TPl0MCNWSUBXdzUVaux0M28UZwIldUxmbWJ0dNlzUxc3QSNnS2IXTHVXUxR1blhWanhXU=0zbJl1bCVDUlZmcGtyQMR1a3IXbjZDOnplclZ3Khl3d2FTQ2hDay8iUzo3btVVYB9kNit0UFxEW21&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=neMtGOtxUZxwUbNdDMZJTVLRFc5U1KGBjVPtkNnN1YrBjUX9WY18SSMJzTZRmU1syZSVEaGJ0TKlGV=0TWk9kRxYEVWlFW5k3SkRWd1Y0Nj9yQ0NnSIN0Q4NWZidWTvBTTLBjeD50aFFkaOFVeVFkdXRWVmZ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=HZmRjTiBlTGF1YHNDMKZzRllmU4AjbIRWTvklUQhXZys0ZHN0UTlzNGJzbQdUQwkGRD9mWnNFdkt0V=0zZLhTdyADUFtWVwQESoVWbTtWV3ImcMZlbLV2LThld1J2Qih1QLRndOlFZ1BlZ15keYh0NSJEZDp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TSvEEVWhzcxpHc0c3StVnSDJlNZR0VNlHTLpkVSd0VQRVdIB3VWJFU2JWV1l0a4lVQlh2UHRWWGVnW=0TR5cka0RjWu1WW5MWSyMFbitEZ6N1K3AndFNnQIVVSyIEUMpWe5N1T3MlZxRmY3ZnQZ1UU0QEdQR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TSvEEVWhzcxpHc0c3StVnSDJlNZR0VNlHTLpkVSd0VQRVdIB3VWJFU2JWV1l0a4lVQlh2UHRWWGVnW=0DNxcUZZhzRGR1RvhlSytCU2YUVyIDSxBndFNnQIVVSyIEUMpWe5N1T3MlZxRmY3ZnQZ1UU0QEdQR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=lQThUNH5WN58CbKhFN2okcFRleBJDSlJFbsV0KuBzcsdzTLtERVRzQ4pETNBVONJWYwM1SoZXTaZGZ=0TQv50Yz92ayVTSWhVdlZDZ4UndaNGUFVVdltyUTZHSxkEcw0URUFkb6JWeHdDast0UwJWWZZTRmp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=0VW9maClGOvp1SRxUaOdUaGhETXBHMCZjNQtUewolTwI0RuBVbml1cpZjYrlmRz8GZsRERJ9kcCh0Z=0zcRpkbkJXbvoEaxIHVr4GT0Y0NGZEVyQGV3UWYUNDN4JTR2YlVxMkdiR3dGNDVE1me5h0VUVVYqd&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=qd0VW9maClGOvp1SRxUaOdUaGhETXBHMCZjNQtUewolTwI0RuBVbml1cpZjYrlmRz8GZsRERJ9kcCh0Zj52b6F1Vj5GTz92aHl0Mzl1VKdDTEJkdzxUeORVcrZTU0NXRyJGMphGbxMkdiR3dGNDVE1me5h0VUVVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FhjT4JzatNmajNUdW9ENih3RBJEO510R4cHeq1EROBnUntyVENXaz9WRENlWXZmbvAzV24mdhp1VWNnaxRGUSJGTS12ZhxUN5x2SRlXQJRXc3RnVqB3TodjN0VVWIVlR4gUYndVTBVWO2V2U3plaZh2VMJUWQhHb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FeKh1cYNzYQ5URWFXcwNmarsGVys2RSx0NHNkZaRjNz1EMwJnaLpERE5mco5WY4BlSVllbCJ3SxNWb=0TRW10caFkSvdlT0YkVxlGRZpmaTRDWYJDeaBzMttUTXlWa6RVbmVWYwhHWk1UShdnNuJ2Tih3UyZ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FU5NmQiNEN1w0QSZEWz0mSEFDdENlav52NVpkUrFnVwhnYsVWTsFlWMp0K25kYu90QCp0ZjtEcTVUc=0zZjpkZIF3RQRmUVlEOGVTVZFmTNRUYLd2Ui1mZ09icWZWQBVzdspGcNh1LOF1LSd0QWtGO3kGRul&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FU5NmQiNEN1w0QSZEWz0mSEFDdENlav52NVpkUrFnVwhnYsVWTsFlWMp0K25kYu90QCp0ZjtEcTVUc=0DMClDajJHSQRmUVlEOGVTVZFmTNRUYLd2Ui1mZ09icWZWQBVzdspGcNh1LOF1LSd0QWtGO3kGRul&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ElVV182SxQWNyUWNEZzM4hkVWNVQCVVbVl2SWFDTshWV5UGSBJnYURHTtlVN6RkQ380MIRXUENWVtBHdEJWQl9EawFFVUpHRJdGUZd3NOBzU5gWcSpndvh2KVh3QOVXUvATbmdnN4R1NVdnRM5EV0BlcXVTV0V2R&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=idVQmtketNUZLVGc1cGaL5WZmx0auh3bDV2KBFTTxMTV0JGOQtSS2FUYvR2NGpGWuFXWwVmSk5mQPp1dltiQrAFSzEVSzEjYnd3aDJmT2MUN4UHcrEWdVpHZaZlQx82MqRlUMJUSRRHMolFNzIGSTJ2NzQnbiNWd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=idVQmtketNUZLVGc1cGaL5WZmx0auh3bDV2KBFTTxMTV0JGOQtSS2FUYvR2NGpGWuFXWwVmSk5mQPp1dqp0RycGSykUYTpWdk9mZwFVVY9SW0NHdlV0aJZVVSJHezdnTxFkQrYzNURHMolFNzIGSTJ2NzQnbiNWd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=sd3QQRXUWNnSEtkR1Z0RYljN08mSWhFTlRUNzhUWIBzMEd1VDt2MWhWdYBnb3J1RxJVRrAlQFdkbpNkeI5Wca9EVZ9iWN9EUwZGRvJTS1B3aV1kUlBVWMhnYwUTUHJkUO5WUw82M1RXMI1WZkZzL4ZHT2lGO0EHd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=sd3QQRXUWNnSEtkR1Z0RYljN08mSWhFTlRUNzhUWIBzMEd1VDt2MWhWdYBnb3J1RxJVRrAlQFdkbpNkeZZmdXBFVZ9iWN9EUwZGRvJTS1B3aV1kUlBVWMhnYwUTUHJkUO5WUw82M1RXMI1WZkZzL4ZHT2lGO0EHd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ZZlM5x0K2lnVDZHa4oFTshjd240YS9Eb35mSxxEdOZlSSlVWiREM2A1cHJ0ZXlETuFVU2JUdml1UL1GRudjN44kMPFFTVFkMKRGMhR2TalzQ4EFdZJEO2Jkb1pVYBRXNpVzQYlTS3FmcUF3ROhTWjZjeBpkbvgFc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=GaTlWQOZHezEEUV9ib5YkQttUOkdGTMV2Z2dURMhjWSdzMNh2dpVnWGpEchhVMqdFMCtWbHpWemd1R=0zdoRnYFV2Vxh2ZKhGZ5h1MKNUcNpnRRhjMzh0dUdmVzlmS4RGZkNVb0R2NNZXN4QHevkjU5Ukc2E&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DZUxEaJ9Wd4JkbCB1YT9CZMt0bxl0L21EarxUQ2o3Z3UVRCtGezQFT5pHOq10bQ9UNzpWSChnYYdHV=0zaz4WYwkVU540dPxGZhZ1TEZna5M0YaZncBR0MzFUaOdVW5w0N6BFW4EmcFZGSkJGa1U2bpRENml&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DZUxEaJ9Wd4JkbCB1YT9CZMt0bxl0L21EarxUQ2o3Z3UVRCtGezQFT5pHOq10bQ9UNzpWSChnYYdHV=0za5xUNxkVU540dPxGZhZ1TEZna5M0YaZncBR0MzFUaOdVW5w0N6BFW4EmcFZGSkJGa1U2bpRENml&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TTzVzNsBzKTt0ZNNzLntWSYdlZ0kDSldXSQZlUDJ3Z3x0LLp1MxgTYvtCWC1mcJVUdHVlQiF1Ryd2V=0TQTRFb4JUcyAFaxRjWvVnUuFlVZFnUyJkVORjWQ9yYmNHdhtyQIdFdDJETrYUd5YVO6JlRaVFS0k&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TTzVzNsBzKTt0ZNNzLntWSYdlZ0kDSldXSQZlUDJ3Z3x0LLp1MxgTYvtCWC1mcJVUdHVlQiF1Ryd2V=0DNqhTe4JUcyAFaxRjWvVnUuFlVZFnUyJkVORjWQ9yYmNHdhtyQIdFdDJETrYUd5YVO6JlRaVFS0k&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=VMZdGdyZUMPtie4wWeK9EcJl3ZwU1VuZVcvYTVxcXUQdnWaNjTxtEUNd1KKhVM3cXShBHZkRnWvRHZ=0TWMBlZ39kNJdFOphVZXNHVOFGdJRUYwBDT4kGTEtieOJDURh0T2hkcK12brFUMrRVSn1kNuZ3S1o&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=VMZdGdyZUMPtie4wWeK9EcJl3ZwU1VuZVcvYTVxcXUQdnWaNjTxtEUNd1KKhVM3cXShBHZkRnWvRHZ=0zYihke49kNJdFOphVZXNHVOFGdJRUYwBDT4kGTEtieOJDURh0T2hkcK12brFUMrRVSn1kNuZ3S1o&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ztkZolEdPNjZv9GUaJ2VTFWYJRzKuFFOzMleiNTcBdjaPdDTXhESzpUTJxWY4JETkV3NzF2VExURRV2ZDFjYtRnSRticyYUMu90MGh3by5ENxEnWspkc3Vnb4kke4lDSyJmSZhjTqZnY2oUc2p2V50GVthmWrtWe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=NJ0bZNGTZtiSWFHU5NlQER0M3lXdyw2R4wUVlZFN5tSYOFnQtRndGJVa3FFerIjYrQDexdHS49GWNJnboVmenlGNaR2R5oXcRhDNxhkRVtGSwAnWIdlNvEzVzg2SyQzdhlGaUZmQOl0UxkVUyZXY3ZHeygGRpVlS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=NJ0bZNGTZtiSWFHU5NlQER0M3lXdyw2R4wUVlZFN5tSYOFnQtRndGJVa3FFerIjYrQDexdHS49GWNJnboR3K082LmdEd5dWZ4IzRrFXWV9CWCp0dPJGR2RmUUNWYo5mcWtSbQx2SOl0UxkVUyZXY3ZHeygGRpVlS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2gGd0gmUK52S5JmM15GW4xUe4dkdLhlMKZ0UkRmNHFkUxoHaGRFahNHTaBVW4IjNmFURydmeZh0QnJWcHNjQN1URT1kSMZFOvolZnJkZzwGR5VnaulVRJ5WSQZ3K6tmRD90Sz00TqJXenh0Y390Vvo1NPVnMkhDc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=0MNhWQBlmRkNkeZplMUx2L5BnYR5UN4RzTFR2LSVUbHRTOjFkeyY0Ka90UohGZK5mUkp1c5NFaKxEd=0TQrg1TaJVSmBFNpJXVL9WOw0WdqJkNhJmaWpGRwsWbrNjZwgEazIUdLdGakNFdBF3K3JEcDZFcyE&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=QFUZhZ2YUhGaINFd5B3MpZVQlhUMnZGeZR1cPFzZ55EZTZmZ4FTbxVjVDpkTrMlWyR0ait0aatmVk92dYVnTmVDehF0KrVWZR5URKdkQzk2d0NVTZVTTUh2btZnaMp1Vw40VZpFcNplTG5kV3IXRLd3ZJZFc4EVS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DN3SZBnWyJHbxcHV3gkZwAlWYJ0S1hUY1ZWc0hkVRFTNzAHdrNHM1g3ULhkbl1GUnN2RIZmVhZlZapEROhlRGRDM4kFT4hHaZFnSRJVMEV1a5sGcDplQFd3K18WVLl3TwMUYJ12cxlzT1UzdBdUavQWcPR2dQhVe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DN3SZBnWyJHbxcHV3gkZwAlWYJ0S1hUY1ZWc0hkVRFTNzAHdrNHM1g3ULhkbl1GUnN2RIZmVhZlZapERxUFWrkXdYNVVa9yanFUTuhHOUR1aktSSBZXY1ZEeiJUOuFmR1kzR5cnNxlzT1UzdBdUavQWcPR2dQhVe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RB1S6Fna5M0MzMEdVR1QahEN48WRq5WRnxUQLFzMu5UcwtWbYdXVyZzTQp2NyIldwYzKpFlTCdGT0x2RLN0YKRjVklVRpNmWrA1TPtES2M1Q2dja090UVl1M6NUUUNkYpx2QVRWTv9mQLlWRqZzbnNzcOhTSntSR&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RB1S6Fna5M0MzMEdVR1QahEN48WRq5WRnxUQLFzMu5UcwtWbYdXVyZzTQp2NyIldwYzKpFlTCdGT0x2R3RWTEBXe5RWeTFXd5NVTmtGeRVUUKd3bnxEWipnZvUXdkpXSEF2UPB1Vv9mQLlWRqZzbnNzcOhTSntSR&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=WN0RP10dXJGV3BjZBVnS4ImRLVHM4BHV0MGU3QnRvlWVa1kVKJHZmd2Vx5kM18We6ZzTHJUejlXeXZ1SQ9UYZFnZtllQKFzTidlcC1EVSZTWyIWMrp1YvIjMPxmcJxkQSlVZTRjUINWR0olZBlUdklUb5FHWr4Ue&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=WN0RP10dXJGV3BjZBVnS4ImRLVHM4BHV0MGU3QnRvlWVa1kVKJHZmd2Vx5kM18We6ZzTHJUejlXeXZ1SKZ1bvY0SLZFbodDNTxUQChlSKBDMPRTZvZHN3ElSthlNrUDWlpGR2gXWINWR0olZBlUdklUb5FHWr4Ue&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RJUez10UiFTS3VXUZBVMGFTZtRGVpZ3dtZ0RBFFSuR3c3I0LYJWaJJWcQJkdhBXYSlEazxWc2JFZxdkTFBFNxdENoFVbOZEWjtmVLF2aCxEaxEFOCNGMQp2V6d0cn1GT4lTSzEFZVdXbz9UVrZUe4IWRpRnV2gER&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1M3KMl1K4VVclZnSW9EURlXYkREMKpkbHFlZTtENMJVZ6dGSqFjQXN1dpNldzMHMNZDSIdlaWNWSTlWUNFTb28EN2cXaUhTYShlRGhzMQNFN6FHRyJzVM9yS1RTYQVWb5EnenRVNENUMVNlZ0o3crYzaD1WVlVEa&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1M3KMl1K4VVclZnSW9EURlXYkREMKpkbHFlZTtENMJVZ6dGSqFjQXN1dpNldzMHMNZDSIdlaWNWSTlWU04WO08UZ3V0QGVGWwFmWLR2L05EaLtibEF1UKl2S1RTYQVWb5EnenRVNENUMVNlZ0o3crYzaD1WVlVEa&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=iNzd1YGbxcmRrgESYVHTlBlROJ0ZMV3bydFcEx2bMZ0NGd0NsZVO0gGSuFjQZpkZ350Q3gkY3V3btRFV0MVd1pHTjFHN0YGNmBnRZVkbSZldhd2RK92NJl1SaV0awQ0aD9ERsJzcN5UQhRVe2ZHS3EWR4VEbzdEO&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=3YjcrFnR3xWNChFTyY1b5A1Mu1mV0EkQ5YVSTZEayx0c0RGOux0VGV1LKhUWadHUYFnWZNXVY5kYPREWjtyQahjbBl2dvFzK050KRJmWkVmdRFnZCVDSUllVP9mYGxmYthHaNdTYJNXW2EXU4UEVEREURN0U0IHc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=3YjcrFnR3xWNChFTyY1b5A1Mu1mV0EkQ5YVSTZEayx0c0RGOux0VGV1LKhUWadHUYFnWZNXVY5kYPREWxl0ZstSUyljb210Nat2N6JXTpZ0UXFUQ1QjQxlTSnBzUKhFea5WQxAnQJNXW2EXU4UEVEREURN0U0IHc&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=nBXYzImVzRVQ2MzUSVDTQ9yZF9SOvsyaYVVWkVUWDl3VBJXa6h2Y2kjUhBDM0QHdKJGcuNWT5h1RpZWYVh3UOt2Nk5mYZdURFhWcOBXZXZFaNdzM5hDNUNXTU92N5d3aN50M1MmQxIkUrN1QXxUT55GS2l0SJ90d&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=nBXYzImVzRVQ2MzUSVDTQ9yZF9SOvsyaYVVWkVUWDl3VBJXa6h2Y2kjUhBDM0QHdKJGcuNWT5h1RpZWYvxUVYdTR69mQPlTd2UGctdmQhR0QZRkTYtSZLtWWCZUVjNkMvYWYQd1RxIkUrN1QXxUT55GS2l0SJ90d&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=KdUQ1NFNUBnZl1mYoBXc3gmQIF0bBlGVi12cy9yMIdVYwklYxNHeTpHMZ1WTZFVNPRXVkZlRZFXbMFFZuNWdIJzV3QmazU1LMZDbNRjVIFDO2o1S0MjSyJ1cN1We2wkVKh2cqtEWiF2SFhkSFVjUw5GW4s0d5x0R&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=JpFazZmcyUVZiZlMBtyaQ5USxZnQ1UWYNRXVOJkTVJXToZEeJ9Wb0gnY6Vncn50bM9mcwcEe6lkWmJ0ZaJzTO9URvUmbmhld0YWZXhUZEdHeXh0UXZ3RSp1QTZ0Lkt2RjdEb1c1R28yd0sGOyJ0KSZDemNTWoVDe&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=JpFazZmcyUVZiZlMBtyaQ5USxZnQ1UWYNRXVOJkTVJXToZEeJ9Wb0gnY6Vncn50bM9mcwcEe6lkWmJ0ZwQVQWpGOodkcwckSD1ER5c2TzZkSOR1TYJFbyJ3YwtWR5JHTjdEb1c1R28yd0sGOyJ0KSZDemNTWoVDe&tablename=CJFDLAST2021&dflag=pdfdown']"
      ]
     },
     "execution_count": 290,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Build the full PDF download URLs by prepending the CNKI host\n",
    "# (https://kns.cnki.net) to every entry of pdf_links, then display them.\n",
    "pdf_href = ['https://kns.cnki.net' + relative_link for relative_link in pdf_links]\n",
    "pdf_href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 291,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详情页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>基于计算机的大数据和云计算技术探析</td>\n",
       "      <td>马珺杰</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>大数据背景下的人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>王婧; 张学娜</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>大数据时代计算机网络安全防范分析</td>\n",
       "      <td>楚丙奇</td>\n",
       "      <td>办公自动化</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究</td>\n",
       "      <td>赵于卓; 黄子莹</td>\n",
       "      <td>中国商论</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>GIS专业自然地理学野外实习的教学改革实践</td>\n",
       "      <td>吴小芳; 钟晓兰; 谢刚生; 何正勇</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于GIS的入侵生物适生区预测——以桔小实蝇为例</td>\n",
       "      <td>张华纬; 赵健; 李志鹏</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-06-24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>GIS技术在地理空间教学实践中的应用</td>\n",
       "      <td>马炎池</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>新工科视域下计算机科学与技术专业大数据方向培养体系探索</td>\n",
       "      <td>李金忠</td>\n",
       "      <td>台州学院学报</td>\n",
       "      <td>2021-06-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>17.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>基于RS和GIS技术的西藏多龙矿集区矿山选址研究</td>\n",
       "      <td>赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥</td>\n",
       "      <td>国土资源遥感</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>大数据时代信息伦理的困境与应对研究</td>\n",
       "      <td>梁宇; 郑易平</td>\n",
       "      <td>科学技术哲学研究</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>542.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发</td>\n",
       "      <td>罗海涛</td>\n",
       "      <td>铁道勘察</td>\n",
       "      <td>2021-06-02 17:41</td>\n",
       "      <td>NaN</td>\n",
       "      <td>339.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>安富利携手合作伙伴共同展示AI创新技术及应用</td>\n",
       "      <td>NaN</td>\n",
       "      <td>单片机与嵌入式系统应用</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>基于计算机的大数据和云计算技术分析</td>\n",
       "      <td>秦蓉</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据背景下的开放教育计算机专业教育改革研究</td>\n",
       "      <td>段超</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析</td>\n",
       "      <td>吴娟</td>\n",
       "      <td>山西农经</td>\n",
       "      <td>2021-05-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>基于计算思维的“Python程序设计”课程教学研究</td>\n",
       "      <td>罗平娟; 彭芳策</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>地理信息系统课程实践教学中改进方法的探究</td>\n",
       "      <td>赵天明</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于GIS的徐州市火灾应急救援系统设计与实现</td>\n",
       "      <td>仲旸; 李保杰; 笪柳炎</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>237.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例</td>\n",
       "      <td>谭磊; 贺美德; 柳飞</td>\n",
       "      <td>测绘与空间地理信息</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>206.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于大数据的设备分析系统研究</td>\n",
       "      <td>王学松; 刘天才</td>\n",
       "      <td>自动化与仪器仪表</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>基于Python的图书馆信息管理系统研发</td>\n",
       "      <td>胡小春; 田婧; 陈燕</td>\n",
       "      <td>信息技术与信息化</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>159.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>计算机软件技术在大数据时代的应用分析</td>\n",
       "      <td>鄢冲</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>14.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>大数据时代下计算机软件技术的应用分析</td>\n",
       "      <td>陈建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>大数据背景下计算机信息技术在网络安全中的运用探析</td>\n",
       "      <td>格桑次仁</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下高职计算机应用技术移动学习的研究</td>\n",
       "      <td>赵建伟</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>大数据时代下计算机软件技术的应用</td>\n",
       "      <td>李永刚</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据环境在“计算机组装与维护”课程教学改革研究中的应用</td>\n",
       "      <td>程光璇; 刘慧</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据与计算机网络的信息安全策略分析</td>\n",
       "      <td>李培培</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>423.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>大数据时代计算机科学与技术专业改造升级路径探索</td>\n",
       "      <td>赵建华; 刘宁</td>\n",
       "      <td>微型电脑应用</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>182.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究</td>\n",
       "      <td>贺宁; 邹晓华; 唐丽萍</td>\n",
       "      <td>江苏科技信息</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>50.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>大数据背景下地方高校人工智能方向人才培养模式探索</td>\n",
       "      <td>叶青; 刘长华</td>\n",
       "      <td>湖北工程学院学报</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>GIS技术在农村饮水安全工程评价系统中的应用</td>\n",
       "      <td>房凯</td>\n",
       "      <td>农业工程</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>基于Python Flask的运维信息管理系统设计与实现</td>\n",
       "      <td>冷四军</td>\n",
       "      <td>电脑编程技巧与维护</td>\n",
       "      <td>2021-05-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>135.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>面向大数据信息时代计算机科学的应用探析</td>\n",
       "      <td>彭雪</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>111.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>基于大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李晓霞</td>\n",
       "      <td>电子测试</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>浅谈GIS对于开展地理教学的影响</td>\n",
       "      <td>王莉; 阿里木江·卡斯木</td>\n",
       "      <td>科学咨询(教育科研)</td>\n",
       "      <td>2021-05-14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>153.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据在粮库信息化中的应用</td>\n",
       "      <td>刘廷凤; 吴建军</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>152.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究</td>\n",
       "      <td>陈艳; 吴珍珍</td>\n",
       "      <td>河北农机</td>\n",
       "      <td>2021-05-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>AIPerf：大规模人工智能算力基准测试程序</td>\n",
       "      <td>翟季冬</td>\n",
       "      <td>大数据</td>\n",
       "      <td>2021-05-06 16:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>69.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>基于stm32系统与物联网的AI多功能门禁系统研究</td>\n",
       "      <td>林佳智;常凤筠;朱文斌;朱瑞昕;张天赐</td>\n",
       "      <td>科学技术创新</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>236.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>大数据时代下人工智能在计算机网络技术中的运用探讨</td>\n",
       "      <td>杨文学</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>大数据驱动的计算机网络远程教学质量评价研究</td>\n",
       "      <td>云洁; 白雪</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>149.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于GIS的城市地下管线信息管理系统研究与实现</td>\n",
       "      <td>孙凯;王青</td>\n",
       "      <td>数字通信世界</td>\n",
       "      <td>2021-05-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>基于Python Flask的温度数据可视化</td>\n",
       "      <td>胡钊</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>大数据在地理信息系统中的应用探索</td>\n",
       "      <td>黄相维</td>\n",
       "      <td>黑龙江水利科技</td>\n",
       "      <td>2021-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>地理信息系统GIS在城市测绘中的应用研究</td>\n",
       "      <td>肖玉勇</td>\n",
       "      <td>智能城市</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>309.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>大数据时代网络信息安全及对应策略研究</td>\n",
       "      <td>集世璞</td>\n",
       "      <td>中小企业管理与科技(下旬刊)</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>405.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>基于大数据的计算机专业学生就业方向研究</td>\n",
       "      <td>陈欣; 江悦</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>GIS与语言学交叉研究</td>\n",
       "      <td>韦韧</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>103.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价</td>\n",
       "      <td>周玲美; 王世航; 权玲</td>\n",
       "      <td>生态与农村环境学报</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>274.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                            基于计算机的大数据和云计算技术探析   \n",
       "1            2                    大数据背景下的人工智能在计算机网络技术中的应用研究   \n",
       "2            3                             大数据时代计算机网络安全防范分析   \n",
       "3            4                 基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究   \n",
       "4            5                        GIS专业自然地理学野外实习的教学改革实践   \n",
       "5            6                     基于GIS的入侵生物适生区预测——以桔小实蝇为例   \n",
       "6            7                           GIS技术在地理空间教学实践中的应用   \n",
       "7            8                  新工科视域下计算机科学与技术专业大数据方向培养体系探索   \n",
       "8            9                     基于RS和GIS技术的西藏多龙矿集区矿山选址研究   \n",
       "9           10                            大数据时代信息伦理的困境与应对研究   \n",
       "10          11            基于“BIM+GIS”的运营城市轨道交通安全监测与评估  网络首发   \n",
       "11          12                       安富利携手合作伙伴共同展示AI创新技术及应用   \n",
       "12          13                            基于计算机的大数据和云计算技术分析   \n",
       "13          14                       大数据背景下的开放教育计算机专业教育改革研究   \n",
       "14          15                     基于GIS的大藤峡水库泄洪下游淹没影响模拟与分析   \n",
       "15          16                    基于计算思维的“Python程序设计”课程教学研究   \n",
       "16          17                         地理信息系统课程实践教学中改进方法的探究   \n",
       "17          18                       基于GIS的徐州市火灾应急救援系统设计与实现   \n",
       "18          19   GIS技术在城市轨道交通安全监测中的应用研究——以某新建地铁穿越既有地铁安全监测为例   \n",
       "19          20                               基于大数据的设备分析系统研究   \n",
       "20          21                         基于Python的图书馆信息管理系统研发   \n",
       "21          22                           计算机软件技术在大数据时代的应用分析   \n",
       "22          23                           大数据时代下计算机软件技术的应用分析   \n",
       "23          24                     大数据背景下计算机信息技术在网络安全中的运用探析   \n",
       "24          25                       大数据背景下高职计算机应用技术移动学习的研究   \n",
       "25          26                             大数据时代下计算机软件技术的应用   \n",
       "26          27                 大数据环境在“计算机组装与维护”课程教学改革研究中的应用   \n",
       "27          28                           大数据与计算机网络的信息安全策略分析   \n",
       "28          29                      大数据时代计算机科学与技术专业改造升级路径探索   \n",
       "29          30               工业互联网背景下大数据技术应用与计算机信息管理专业的融合研究   \n",
       "30          31                     大数据背景下地方高校人工智能方向人才培养模式探索   \n",
       "31          32                       GIS技术在农村饮水安全工程评价系统中的应用   \n",
       "32          33                 基于Python Flask的运维信息管理系统设计与实现   \n",
       "33          34                          面向大数据信息时代计算机科学的应用探析   \n",
       "34          35                      基于大数据时代人工智能在计算机网络技术中的应用   \n",
       "35          36                             浅谈GIS对于开展地理教学的影响   \n",
       "36          37                                大数据在粮库信息化中的应用   \n",
       "37          38  《大学信息技术（Python程序设计）》基于MOOC的线上线下混合教学模式课程建设研究   \n",
       "38          39                       AIPerf：大规模人工智能算力基准测试程序   \n",
       "39          40                    基于stm32系统与物联网的AI多功能门禁系统研究   \n",
       "40          41                     大数据时代下人工智能在计算机网络技术中的运用探讨   \n",
       "41          42                        大数据驱动的计算机网络远程教学质量评价研究   \n",
       "42          43                      基于GIS的城市地下管线信息管理系统研究与实现   \n",
       "43          44                       基于Python Flask的温度数据可视化   \n",
       "44          45                             大数据在地理信息系统中的应用探索   \n",
       "45          46                         地理信息系统GIS在城市测绘中的应用研究   \n",
       "46          47                           大数据时代网络信息安全及对应策略研究   \n",
       "47          48                          基于大数据的计算机专业学生就业方向研究   \n",
       "48          49                                  GIS与语言学交叉研究   \n",
       "49          50               基于遥感和地理信息系统的内蒙古呼日查干淖尔地区生态脆弱性评价   \n",
       "\n",
       "                     作者              刊名              发表时间  被引     下载  操作  \\\n",
       "0                   马珺杰  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载   \n",
       "1               王婧; 张学娜  中小企业管理与科技(中旬刊)        2021-07-02 NaN    NaN  下载   \n",
       "2                   楚丙奇           办公自动化        2021-07-01 NaN    NaN  下载   \n",
       "3              赵于卓; 黄子莹            中国商论        2021-06-30 NaN    NaN  下载   \n",
       "4    吴小芳; 钟晓兰; 谢刚生; 何正勇            测绘通报        2021-06-25 NaN   49.0  下载   \n",
       "5          张华纬; 赵健; 李志鹏       测绘与空间地理信息        2021-06-24 NaN   64.0  下载   \n",
       "6                   马炎池            电子技术        2021-06-20 NaN  152.0  下载   \n",
       "7                   李金忠          台州学院学报        2021-06-20 NaN   17.0  下载   \n",
       "8    赵龙贤;代晶晶;赵元艺;姜琪;刘婷玥          国土资源遥感        2021-06-15 NaN    9.0  下载   \n",
       "9               梁宇; 郑易平        科学技术哲学研究        2021-06-05 NaN  542.0  下载   \n",
       "10                  罗海涛            铁道勘察  2021-06-02 17:41 NaN  339.0  下载   \n",
       "11                  NaN     单片机与嵌入式系统应用        2021-06-01 NaN    NaN  下载   \n",
       "12                   秦蓉          数字通信世界        2021-06-01 NaN    NaN  下载   \n",
       "13                   段超          数字通信世界        2021-06-01 NaN    NaN  下载   \n",
       "14                   吴娟            山西农经        2021-05-30 NaN   19.0  下载   \n",
       "15             罗平娟; 彭芳策         电脑知识与技术        2021-05-25 NaN   71.0  下载   \n",
       "16                  赵天明       测绘与空间地理信息        2021-05-25 NaN   80.0  下载   \n",
       "17         仲旸; 李保杰; 笪柳炎       测绘与空间地理信息        2021-05-25 NaN  237.0  下载   \n",
       "18          谭磊; 贺美德; 柳飞       测绘与空间地理信息        2021-05-25 NaN  206.0  下载   \n",
       "19             王学松; 刘天才        自动化与仪器仪表        2021-05-25 NaN   24.0  下载   \n",
       "20          胡小春; 田婧; 陈燕        信息技术与信息化        2021-05-25 NaN  159.0  下载   \n",
       "21                   鄢冲         数字技术与应用        2021-05-25 NaN   14.0  下载   \n",
       "22                  陈建伟         数字技术与应用        2021-05-25 NaN    8.0  下载   \n",
       "23                 格桑次仁         数字技术与应用        2021-05-25 NaN   11.0  下载   \n",
       "24                  赵建伟         数字技术与应用        2021-05-25 NaN    3.0  下载   \n",
       "25                  李永刚          无线互联科技        2021-05-25 NaN    NaN  下载   \n",
       "26              程光璇; 刘慧          无线互联科技        2021-05-25 NaN    NaN  下载   \n",
       "27                  李培培            电子技术        2021-05-20 NaN  423.0  下载   \n",
       "28              赵建华; 刘宁          微型电脑应用        2021-05-20 NaN  182.0  下载   \n",
       "29         贺宁; 邹晓华; 唐丽萍          江苏科技信息        2021-05-20 NaN   50.0  下载   \n",
       "30              叶青; 刘长华        湖北工程学院学报        2021-05-20 NaN   61.0  下载   \n",
       "31                   房凯            农业工程        2021-05-20 NaN    1.0  下载   \n",
       "32                  冷四军       电脑编程技巧与维护        2021-05-18 NaN  135.0  下载   \n",
       "33                   彭雪  中小企业管理与科技(中旬刊)        2021-05-15 NaN  111.0  下载   \n",
       "34                  李晓霞            电子测试        2021-05-15 NaN   53.0  下载   \n",
       "35         王莉; 阿里木江·卡斯木      科学咨询(教育科研)        2021-05-14 NaN  153.0  下载   \n",
       "36             刘廷凤; 吴建军          现代电子技术        2021-05-12 NaN  152.0  下载   \n",
       "37              陈艳; 吴珍珍            河北农机        2021-05-10 NaN   33.0  下载   \n",
       "38                  翟季冬             大数据  2021-05-06 16:32 NaN   69.0  下载   \n",
       "39  林佳智;常凤筠;朱文斌;朱瑞昕;张天赐          科学技术创新        2021-05-05 NaN  236.0  下载   \n",
       "40                  杨文学         电脑知识与技术        2021-05-05 NaN   38.0  下载   \n",
       "41               云洁; 白雪          现代电子技术        2021-05-01 NaN  149.0  下载   \n",
       "42                孙凯;王青          数字通信世界        2021-05-01 NaN   32.0  下载   \n",
       "43                   胡钊            电子世界        2021-04-30 NaN  274.0  下载   \n",
       "44                  黄相维         黑龙江水利科技        2021-04-30 NaN  123.0  下载   \n",
       "45                  肖玉勇            智能城市        2021-04-28 NaN  309.0  下载   \n",
       "46                  集世璞  中小企业管理与科技(下旬刊)        2021-04-25 NaN  405.0  下载   \n",
       "47               陈欣; 江悦         电脑知识与技术        2021-04-25 NaN  119.0  下载   \n",
       "48                   韦韧            测绘通报        2021-04-25 NaN  103.0  下载   \n",
       "49         周玲美; 王世航; 权玲       生态与农村环境学报        2021-04-25 NaN  274.0  下载   \n",
       "\n",
       "                                                详情页链接  \\\n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                              PDF下载链接  \n",
       "0   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "5   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "6   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "7   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "8   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "9   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "10  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "11  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "12  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "13  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "14  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "15  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "16  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "17  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "18  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "19  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "20  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "21  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "22  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "23  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "24  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "25  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "26  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "27  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "28  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "29  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "30  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "31  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "32  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "33  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "34  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "35  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "36  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "37  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "38  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "39  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "40  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "41  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "42  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "43  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "44  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "45  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "46  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "47  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "48  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "49  https://kns.cnki.net/kcms/download.aspx?filena...  "
      ]
     },
     "execution_count": 291,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Merge the PDF download links into the first-page results table.\n",
    "# Any 'PDF下载链接' column left by an earlier run is dropped first, so\n",
    "# re-running this cell replaces the column instead of adding a duplicate.\n",
    "df_pdf_links = pd.DataFrame({'PDF下载链接': pdf_href})\n",
    "df_首页 = pd.concat(\n",
    "    [df_首页.drop(columns=['PDF下载链接'], errors='ignore'), df_pdf_links],\n",
    "    axis=1,\n",
    ")\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 292,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 查看最大页码"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 293,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'共120页'"
      ]
     },
     "execution_count": 293,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the page-count label shown in the results toolbar.\n",
    "# find_element(by, value) replaces find_element_by_xpath, which is deprecated\n",
    "# and removed in Selenium 4.3+; 'xpath' is the value of By.XPATH.\n",
    "driver.find_element('xpath', '//*[@id=\"gridTable\"]/div[2]/span[1]').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 294,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'下一页'"
      ]
     },
     "execution_count": 294,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 翻页\n",
    "element = driver.find_element_by_id('PageNext')\n",
    "element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 295,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14]\n"
     ]
    }
   ],
   "source": [
    "page = list(range(1,15))\n",
    "print(page)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 296,
   "metadata": {},
   "outputs": [],
   "source": [
    "root_group=[]\n",
    "table_html = dict()\n",
    "main_content =\"\"\n",
    "element = None"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 299,
   "metadata": {},
   "outputs": [],
   "source": [
    "def page_process(pages, delay=3):\n",
    "    \"\"\"Click through result pages and record the HTML of each one.\n",
    "\n",
    "    For every entry ``p`` in ``pages`` this clicks the element with id\n",
    "    ``PageNext``, sleeps ``delay`` seconds, and then\n",
    "\n",
    "    * appends the lxml-parsed page source to the global ``root_group``;\n",
    "    * stores the innerHTML of the ``gridTable`` element in the global\n",
    "      ``表格_html`` under key ``p``.\n",
    "\n",
    "    The click happens before the capture, so key ``p`` holds the page that\n",
    "    is displayed after the p-th click of this call.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    pages : iterable\n",
    "        Keys to store the captured pages under; one click per entry.\n",
    "    delay : float, optional\n",
    "        Seconds to sleep after each click. Defaults to 3, the wait that was\n",
    "        previously hard-coded.\n",
    "\n",
    "    Notes\n",
    "    -----\n",
    "    Relies on the notebook globals ``driver``, ``root_group`` and\n",
    "    ``表格_html``. Calling it again appends to ``root_group`` again.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        # find_element(by, value) replaces find_element_by_id, which is\n",
    "        # deprecated and removed in Selenium 4.3+; 'id' is the value of By.ID.\n",
    "        driver.find_element('id', 'PageNext').click()\n",
    "        time.sleep(delay)  # fixed pause so the next page of results can load\n",
    "\n",
    "        # Keep the parsed tree of the whole page (later cells run XPath on it).\n",
    "        root_group.append(fromstring(driver.page_source))\n",
    "\n",
    "        # Keep the raw HTML of the results grid (later parsed with pd.read_html).\n",
    "        表格_html[p] = driver.find_element('id', 'gridTable').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 300,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t11\t12\t13\t14\t"
     ]
    }
   ],
   "source": [
    "# Crawl one page per entry of `page`; each iteration clicks 'PageNext' once.\n",
    "page_process(page)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 301,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        html_snippets\n",
       "0   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "1   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "2   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "3   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "4   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "5   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "6   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "7   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "8   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "9   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "10  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "11  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "12  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "13  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "14  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ..."
      ]
     },
     "execution_count": 301,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# One row per captured page: index = page key, value = raw HTML of the results grid.\n",
    "# After the transpose the single column is labelled 0; give it a readable name.\n",
    "df = pd.DataFrame([表格_html]).T.rename(columns={0: \"html_snippets\"})\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 302,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parse the results table out of each stored HTML snippet.\n",
    "# NOTE(review): `pages` is not assigned in the nearby cells (the page list\n",
    "# built above is named `page`) -- confirm where `pages` comes from.\n",
    "l_df = []\n",
    "for p in pages:\n",
    "    # read_html returns a list of tables; only the first one is kept\n",
    "    表格 = pd.read_html(表格_html[p])[0]\n",
    "    l_df.append(表格)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 303,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>大数据时代下计算机科学与技术专业综合改革</td>\n",
       "      <td>李洁</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>大数据背景下的计算机专业教学改革探讨</td>\n",
       "      <td>刘英</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>大数据时代计算机网络的安全问题及防范措施</td>\n",
       "      <td>赵培植</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>153.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>大数据时代计算机网络安全问题及对策分析</td>\n",
       "      <td>王研</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>68.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>大数据技术在计算机网络数据库建设中的运用</td>\n",
       "      <td>李少敏; 陈升晖</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>245</th>\n",
       "      <td>396</td>\n",
       "      <td>拖拉机电气故障诊断方法研究——基于深度学习理论和大数据</td>\n",
       "      <td>王素芳; 谢芳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2020-08-21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>172.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>246</th>\n",
       "      <td>397</td>\n",
       "      <td>基于营配大数据的配网故障定位系统的设计与实现</td>\n",
       "      <td>袁忠军;王丹;段湛辉;陈业伟;李明勇</td>\n",
       "      <td>电力大数据</td>\n",
       "      <td>2020-08-21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>17.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>247</th>\n",
       "      <td>398</td>\n",
       "      <td>要重视AI基础理论的创新——记姚期智院士在2020世界人工智能大会上的演讲</td>\n",
       "      <td>蔚子</td>\n",
       "      <td>上海质量</td>\n",
       "      <td>2020-08-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>248</th>\n",
       "      <td>399</td>\n",
       "      <td>基于大数据技术的公安情报流程分析</td>\n",
       "      <td>郝赫</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2020-08-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>154.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>249</th>\n",
       "      <td>400</td>\n",
       "      <td>大数据时代计算机网络安全及防范措施探析</td>\n",
       "      <td>彭鹏</td>\n",
       "      <td>黑龙江科学</td>\n",
       "      <td>2020-08-18</td>\n",
       "      <td>5.0</td>\n",
       "      <td>249.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>250 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                     篇名                  作者  \\\n",
       "0            51                   大数据时代下计算机科学与技术专业综合改革                  李洁   \n",
       "1            52                     大数据背景下的计算机专业教学改革探讨                  刘英   \n",
       "2            53                   大数据时代计算机网络的安全问题及防范措施                 赵培植   \n",
       "3            54                    大数据时代计算机网络安全问题及对策分析                  王研   \n",
       "4            55                   大数据技术在计算机网络数据库建设中的运用            李少敏; 陈升晖   \n",
       "..          ...                                    ...                 ...   \n",
       "245         396            拖拉机电气故障诊断方法研究——基于深度学习理论和大数据             王素芳; 谢芳   \n",
       "246         397                 基于营配大数据的配网故障定位系统的设计与实现  袁忠军;王丹;段湛辉;陈业伟;李明勇   \n",
       "247         398  要重视AI基础理论的创新——记姚期智院士在2020世界人工智能大会上的演讲                  蔚子   \n",
       "248         399                       基于大数据技术的公安情报流程分析                  郝赫   \n",
       "249         400                    大数据时代计算机网络安全及防范措施探析                  彭鹏   \n",
       "\n",
       "          刊名        发表时间   被引     下载  操作  \n",
       "0     无线互联科技  2021-04-25  NaN   33.0  下载  \n",
       "1     无线互联科技  2021-04-25  NaN   20.0  下载  \n",
       "2    数字技术与应用  2021-04-25  NaN  153.0  下载  \n",
       "3     无线互联科技  2021-04-25  NaN   68.0  下载  \n",
       "4     无线互联科技  2021-04-25  NaN   20.0  下载  \n",
       "..       ...         ...  ...    ...  ..  \n",
       "245    农机化研究  2020-08-21  NaN  172.0  下载  \n",
       "246    电力大数据  2020-08-21  NaN   17.0  下载  \n",
       "247     上海质量  2020-08-20  NaN   32.0  下载  \n",
       "248     电子技术  2020-08-20  NaN  154.0  下载  \n",
       "249    黑龙江科学  2020-08-18  5.0  249.0  下载  \n",
       "\n",
       "[250 rows x 8 columns]"
      ]
     },
     "execution_count": 303,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Stack the per-page tables into one frame with a fresh 0..n-1 index.\n",
    "df_url_out = pd.concat(l_df, ignore_index=True)\n",
    "df_url_out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 304,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Detail-page links\n",
    "# Collect the hrefs in the second table column of every parsed results page\n",
    "# into one flat list. Every page in root_group is included; the previous\n",
    "# version summed only href_group[0]..href_group[8], which dropped any later\n",
    "# pages and raised IndexError when fewer than nine pages had been crawled.\n",
    "href_group = []\n",
    "\n",
    "for i in root_group:\n",
    "    href = i.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')\n",
    "    href_group.extend(href)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 305,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>445</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>446</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>447</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>448</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>449</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>450 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "..                                                 ...\n",
       "445  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "446  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "447  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "448  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "449  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "\n",
       "[450 rows x 1 columns]"
      ]
     },
     "execution_count": 305,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Pass every collected href through correct() and tabulate the results.\n",
    "href_group_correct = list(map(correct, href_group))\n",
    "df_link = pd.DataFrame({'详细页链接': href_group_correct})\n",
    "df_link"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 306,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "20\n",
      "21\n",
      "22\n",
      "23\n",
      "24\n",
      "25\n",
      "26\n",
      "27\n",
      "28\n",
      "29\n",
      "30\n",
      "31\n",
      "32\n",
      "33\n",
      "34\n",
      "35\n",
      "36\n",
      "37\n",
      "38\n",
      "39\n",
      "40\n",
      "41\n",
      "42\n",
      "43\n",
      "44\n",
      "45\n",
      "46\n",
      "47\n",
      "48\n",
      "49\n",
      "50\n",
      "51\n",
      "52\n",
      "53\n",
      "54\n",
      "55\n",
      "56\n",
      "57\n",
      "58\n",
      "59\n",
      "60\n",
      "61\n",
      "62\n",
      "63\n",
      "64\n",
      "65\n",
      "66\n",
      "67\n",
      "68\n",
      "69\n",
      "70\n",
      "71\n",
      "72\n",
      "73\n",
      "74\n",
      "75\n",
      "76\n",
      "77\n",
      "78\n",
      "79\n",
      "80\n",
      "81\n",
      "82\n",
      "83\n",
      "84\n",
      "85\n",
      "86\n",
      "87\n",
      "88\n",
      "89\n",
      "90\n",
      "91\n",
      "92\n",
      "93\n",
      "94\n",
      "95\n",
      "96\n",
      "97\n",
      "98\n",
      "99\n",
      "100\n",
      "101\n",
      "102\n",
      "103\n",
      "104\n",
      "105\n",
      "106\n",
      "107\n",
      "108\n",
      "109\n",
      "110\n",
      "111\n",
      "112\n",
      "113\n",
      "114\n",
      "115\n",
      "116\n",
      "117\n",
      "118\n",
      "119\n",
      "120\n",
      "121\n",
      "122\n",
      "123\n",
      "124\n",
      "125\n",
      "126\n",
      "127\n",
      "128\n",
      "129\n",
      "130\n",
      "131\n",
      "132\n",
      "133\n",
      "134\n",
      "135\n",
      "136\n",
      "137\n",
      "138\n",
      "139\n",
      "140\n",
      "141\n",
      "142\n",
      "143\n",
      "144\n",
      "145\n",
      "146\n",
      "147\n",
      "148\n",
      "149\n",
      "150\n",
      "151\n",
      "152\n",
      "153\n",
      "154\n",
      "155\n",
      "156\n",
      "157\n",
      "158\n",
      "159\n",
      "160\n",
      "161\n",
      "162\n",
      "163\n",
      "164\n",
      "165\n",
      "166\n",
      "167\n",
      "168\n",
      "169\n",
      "170\n",
      "171\n",
      "172\n",
      "173\n",
      "174\n",
      "175\n",
      "176\n",
      "177\n",
      "178\n",
      "179\n",
      "180\n",
      "181\n",
      "182\n",
      "183\n",
      "184\n",
      "185\n",
      "186\n",
      "187\n",
      "188\n",
      "189\n",
      "190\n",
      "191\n",
      "192\n",
      "193\n",
      "194\n",
      "195\n",
      "196\n",
      "197\n",
      "198\n",
      "199\n",
      "200\n",
      "201\n",
      "202\n",
      "203\n",
      "204\n",
      "205\n",
      "206\n",
      "207\n",
      "208\n",
      "209\n",
      "210\n",
      "211\n",
      "212\n",
      "213\n",
      "214\n",
      "215\n",
      "216\n",
      "217\n",
      "218\n",
      "219\n",
      "220\n",
      "221\n",
      "222\n",
      "223\n",
      "224\n",
      "225\n",
      "226\n",
      "227\n",
      "228\n",
      "229\n",
      "230\n",
      "231\n",
      "232\n",
      "233\n",
      "234\n",
      "235\n",
      "236\n",
      "237\n",
      "238\n",
      "239\n",
      "240\n",
      "241\n",
      "242\n",
      "243\n",
      "244\n",
      "245\n",
      "246\n",
      "247\n",
      "248\n",
      "249\n",
      "250\n",
      "251\n",
      "252\n",
      "253\n",
      "254\n",
      "255\n",
      "256\n",
      "257\n",
      "258\n",
      "259\n",
      "260\n",
      "261\n",
      "262\n",
      "263\n",
      "264\n",
      "265\n",
      "266\n",
      "267\n",
      "268\n",
      "269\n",
      "270\n",
      "271\n",
      "272\n",
      "273\n",
      "274\n",
      "275\n",
      "276\n",
      "277\n",
      "278\n",
      "279\n",
      "280\n",
      "281\n",
      "282\n",
      "283\n",
      "284\n",
      "285\n",
      "286\n",
      "287\n",
      "288\n",
      "289\n",
      "290\n",
      "291\n",
      "292\n",
      "293\n",
      "294\n",
      "295\n",
      "296\n",
      "297\n",
      "298\n",
      "299\n",
      "300\n",
      "301\n",
      "302\n",
      "303\n",
      "304\n",
      "305\n",
      "306\n",
      "307\n",
      "308\n",
      "309\n",
      "310\n",
      "311\n",
      "312\n",
      "313\n",
      "314\n",
      "315\n",
      "316\n",
      "317\n",
      "318\n",
      "319\n",
      "320\n",
      "321\n",
      "322\n",
      "323\n",
      "324\n",
      "325\n",
      "326\n",
      "327\n",
      "328\n",
      "329\n",
      "330\n",
      "331\n",
      "332\n",
      "333\n",
      "334\n",
      "335\n",
      "336\n",
      "337\n",
      "338\n",
      "339\n",
      "340\n",
      "341\n",
      "342\n",
      "343\n",
      "344\n",
      "345\n",
      "346\n",
      "347\n",
      "348\n",
      "349\n",
      "350\n",
      "351\n",
      "352\n",
      "353\n",
      "354\n",
      "355\n",
      "356\n",
      "357\n",
      "358\n",
      "359\n",
      "360\n",
      "361\n",
      "362\n",
      "363\n",
      "364\n",
      "365\n",
      "366\n",
      "367\n",
      "368\n",
      "369\n",
      "370\n",
      "371\n",
      "372\n",
      "373\n",
      "374\n",
      "375\n",
      "376\n",
      "377\n",
      "378\n",
      "379\n",
      "380\n",
      "381\n",
      "382\n",
      "383\n",
      "384\n",
      "385\n",
      "386\n",
      "387\n",
      "388\n",
      "389\n",
      "390\n",
      "391\n",
      "392\n",
      "393\n",
      "394\n",
      "395\n",
      "396\n",
      "397\n",
      "398\n",
      "399\n",
      "400\n",
      "401\n",
      "402\n",
      "403\n",
      "404\n",
      "405\n",
      "406\n",
      "407\n",
      "408\n",
      "409\n",
      "410\n",
      "411\n",
      "412\n",
      "413\n",
      "414\n",
      "415\n",
      "416\n",
      "417\n",
      "418\n",
      "419\n",
      "420\n",
      "421\n",
      "422\n",
      "423\n",
      "424\n",
      "425\n",
      "426\n",
      "427\n",
      "428\n",
      "429\n",
      "430\n",
      "431\n",
      "432\n",
      "433\n",
      "434\n",
      "435\n",
      "436\n",
      "437\n",
      "438\n",
      "439\n",
      "440\n",
      "441\n",
      "442\n",
      "443\n",
      "444\n",
      "445\n",
      "446\n",
      "447\n",
      "448\n",
      "449\n",
      "450\n"
     ]
    }
   ],
   "source": [
    "# Collect the PDF download link from each article detail page.\n",
    "# NOTE: pages that fail are skipped, so pdf_links can end up shorter than\n",
    "# href_group_correct; failed_urls records which pages were skipped.\n",
    "pdf_links = []\n",
    "failed_urls = []\n",
    "link_num = 0\n",
    "\n",
    "for url in href_group_correct:\n",
    "    try:\n",
    "        r = session.get(url)\n",
    "        # Keep the second @href matched under id=\"pdfDown\" (index 1), as before.\n",
    "        pdf_link_xpath = r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "    except Exception as exc:\n",
    "        # Not a bare `except:` so that interrupting the kernel still stops the loop.\n",
    "        failed_urls.append(url)\n",
    "        print('skipped', url, repr(exc))\n",
    "    else:\n",
    "        pdf_links.append(pdf_link_xpath)\n",
    "        link_num += 1\n",
    "        print(link_num)\n",
    "    finally:\n",
    "        # Throttle after every request, including the failed ones.\n",
    "        time.sleep(0.8)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 307,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Prepend the CNKI host to every scraped link to obtain an absolute URL.\n",
    "pdf_links_correct = ['https://kns.cnki.net' + relative_link for relative_link in pdf_links]\n",
    "# Single-column frame holding the absolute PDF download URLs.\n",
    "df_pdf_download = pd.DataFrame(data={'PDF下载链接': pdf_links_correct})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 308,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Join df_link and df_pdf_download side by side; rows are matched by index label.\n",
    "df_链接列表合并 = pd.concat(objs=[df_link, df_pdf_download], axis='columns')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 309,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Join df_url_out and the combined link table side by side; rows are matched by index label.\n",
    "df_合并 = pd.concat(objs=[df_url_out, df_链接列表合并], axis='columns')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 310,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详情页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>基于计算机的大数据和云计算技术探析</td>\n",
       "      <td>马珺杰</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2.0</td>\n",
       "      <td>大数据背景下的人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>王婧; 张学娜</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3.0</td>\n",
       "      <td>大数据时代计算机网络安全防范分析</td>\n",
       "      <td>楚丙奇</td>\n",
       "      <td>办公自动化</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4.0</td>\n",
       "      <td>基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究</td>\n",
       "      <td>赵于卓; 黄子莹</td>\n",
       "      <td>中国商论</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5.0</td>\n",
       "      <td>GIS专业自然地理学野外实习的教学改革实践</td>\n",
       "      <td>吴小芳; 钟晓兰; 谢刚生; 何正勇</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>495</th>\n",
       "      <td>445</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>496</th>\n",
       "      <td>446</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>497</th>\n",
       "      <td>447</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>498</th>\n",
       "      <td>448</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>499</th>\n",
       "      <td>449</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>500 rows × 12 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                            篇名                  作者  \\\n",
       "0        0         1.0             基于计算机的大数据和云计算技术探析                 马珺杰   \n",
       "1        1         2.0     大数据背景下的人工智能在计算机网络技术中的应用研究             王婧; 张学娜   \n",
       "2        2         3.0              大数据时代计算机网络安全防范分析                 楚丙奇   \n",
       "3        3         4.0  基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究            赵于卓; 黄子莹   \n",
       "4        4         5.0         GIS专业自然地理学野外实习的教学改革实践  吴小芳; 钟晓兰; 谢刚生; 何正勇   \n",
       "..     ...         ...                           ...                 ...   \n",
       "495    445         NaN                           NaN                 NaN   \n",
       "496    446         NaN                           NaN                 NaN   \n",
       "497    447         NaN                           NaN                 NaN   \n",
       "498    448         NaN                           NaN                 NaN   \n",
       "499    449         NaN                           NaN                 NaN   \n",
       "\n",
       "                 刊名        发表时间  被引    下载   操作  \\\n",
       "0    中小企业管理与科技(中旬刊)  2021-07-02 NaN   NaN   下载   \n",
       "1    中小企业管理与科技(中旬刊)  2021-07-02 NaN   NaN   下载   \n",
       "2             办公自动化  2021-07-01 NaN   NaN   下载   \n",
       "3              中国商论  2021-06-30 NaN   NaN   下载   \n",
       "4              测绘通报  2021-06-25 NaN  49.0   下载   \n",
       "..              ...         ...  ..   ...  ...   \n",
       "495             NaN         NaN NaN   NaN  NaN   \n",
       "496             NaN         NaN NaN   NaN  NaN   \n",
       "497             NaN         NaN NaN   NaN  NaN   \n",
       "498             NaN         NaN NaN   NaN  NaN   \n",
       "499             NaN         NaN NaN   NaN  NaN   \n",
       "\n",
       "                                                 详情页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "495                                                NaN   \n",
       "496                                                NaN   \n",
       "497                                                NaN   \n",
       "498                                                NaN   \n",
       "499                                                NaN   \n",
       "\n",
       "                                               PDF下载链接  \\\n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "..                                                 ...   \n",
       "495  https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "496  https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "497  https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "498  https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "499  https://kns.cnki.net/kcms/download.aspx?filena...   \n",
       "\n",
       "                                                 详细页链接  \n",
       "0                                                  NaN  \n",
       "1                                                  NaN  \n",
       "2                                                  NaN  \n",
       "3                                                  NaN  \n",
       "4                                                  NaN  \n",
       "..                                                 ...  \n",
       "495  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "496  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "497  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "498  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "499  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "\n",
       "[500 rows x 12 columns]"
      ]
     },
     "execution_count": 310,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Stack df_首页 and df_合并 row-wise into one frame.\n",
    "# pd.concat replaces DataFrame.append, which was deprecated in pandas 1.4 and removed in 2.0.\n",
    "# reset_index() keeps the previous row labels as an `index` column, as before.\n",
    "df_总表 = pd.concat([df_首页, df_合并]).reset_index()\n",
    "df_总表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 311,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Save the combined table to a local Excel workbook (sheet \"数据\"), overwriting any existing file.\n",
    "df_总表.to_excel('cnki文章数据.xlsx', sheet_name=\"数据\", engine=\"openpyxl\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 312,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 导出refworks文件"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 313,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the element with id=\"total\".\n",
    "# find_element('xpath', ...) replaces find_element_by_xpath, which Selenium 4.3 removed;\n",
    "# 'xpath' is the string value of By.XPATH. click() returns None, so locate first, then click.\n",
    "element = driver.find_element('xpath', '//*[@id=\"total\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 314,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14]\n"
     ]
    }
   ],
   "source": [
    "page = list(range(1,15))\n",
    "print(page)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 315,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Pagination helper\n",
    "def process_pages(pages, min_wait=30, max_wait=50):\n",
    "    \"\"\"Click through result pages and store each page's table HTML in `表格_html`.\n",
    "\n",
    "    For every entry in `pages` the 'PageNext' button is clicked first, so the HTML\n",
    "    stored under key `p` is that of the page reached after the click.\n",
    "\n",
    "    Args:\n",
    "        pages: iterable of keys, one per click of the next-page button.\n",
    "        min_wait: lower bound, in seconds, of the random pause after each click.\n",
    "        max_wait: upper bound, in seconds, of the random pause after each click.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        # Locate the next-page button and click it.\n",
    "        # find_element('id', ...) replaces find_element_by_id (removed in Selenium 4.3).\n",
    "        next_button = driver.find_element('id', 'PageNext')\n",
    "        next_button.click()\n",
    "        # Pause for a random interval to lower the chance of a ban or captcha.\n",
    "        # `random` is the module here, so the former bare `random()` call raised TypeError.\n",
    "        time.sleep(random.uniform(min_wait, max_wait))\n",
    "        # Grab the table that holds the page's main data.\n",
    "        element = driver.find_element('id', 'gridTable')\n",
    "        main_content = element.get_attribute('innerHTML')\n",
    "        表格_html[p] = main_content"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 320,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\t1\t2\t3\t4\t"
     ]
    }
   ],
   "source": [
    "# NOTE(review): the nearby cells define `process_pages`, not `page_process` — confirm this name\n",
    "# exists in a fresh kernel before relying on this cell.\n",
    "page_process(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 322,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export / analysis: click the <i class=\"icon-d\"> icon.\n",
    "# find_element('xpath', ...) replaces find_element_by_xpath (removed in Selenium 4.3).\n",
    "element = driver.find_element('xpath', '//i[@class=\"icon-d\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 323,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click \"export literature\" in the batch-operations box.\n",
    "# find_element('xpath', ...) replaces find_element_by_xpath (removed in Selenium 4.3).\n",
    "element = driver.find_element('xpath', '//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 324,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Choose the Refworks export format.\n",
    "# find_element('xpath', ...) replaces find_element_by_xpath (removed in Selenium 4.3).\n",
    "# NOTE(review): this absolute XPath depends on the exact page layout — confirm it still matches.\n",
    "element = driver.find_element('xpath', '/html/body/div[3]/div[2]/div[2]/div[2]/form/div/div[1]/div[2]/ul[1]/li[2]/ul/li[1]/ul/li[8]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 342,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-629082E3B45570093EBFC0633EC53B94',\n",
       " 'CDwindow-3C3BD51F846E1D8E34ABBE5D4B52E434']"
      ]
     },
     "execution_count": 342,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# IDs (handles) of all windows currently open in the driver session\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 343,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-343-df45c8daf1de>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Switch to the last window handle in the list.\n",
    "# switch_to.window replaces the deprecated switch_to_window; index -1 avoids the IndexError\n",
    "# that a fixed index 2 raises when only two windows are open.\n",
    "driver.switch_to.window(driver.window_handles[-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 点击学术期刊"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 344,
   "metadata": {},
   "outputs": [
    {
     "ename": "NoSuchElementException",
     "evalue": "Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//i[@class=\"icon icon-export\"]\"}\n  (Session info: chrome=91.0.4472.77)\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNoSuchElementException\u001b[0m                    Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-344-c66e2c4007ed>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;31m# 导出 .txt文件\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//i[@class=\"icon icon-export\"]'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mclick\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      3\u001b[0m \u001b[1;31m# 窗口切换批量导出页面\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element_by_xpath\u001b[1;34m(self, xpath)\u001b[0m\n\u001b[0;32m    392\u001b[0m             \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//div/td[1]'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    393\u001b[0m         \"\"\"\n\u001b[1;32m--> 394\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mby\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mXPATH\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    395\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    396\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mfind_elements_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element\u001b[1;34m(self, by, value)\u001b[0m\n\u001b[0;32m    974\u001b[0m                 \u001b[0mby\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mCSS_SELECTOR\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    975\u001b[0m                 \u001b[0mvalue\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'[name=\"%s\"]'\u001b[0m \u001b[1;33m%\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 976\u001b[1;33m         return self.execute(Command.FIND_ELEMENT, {\n\u001b[0m\u001b[0;32m    977\u001b[0m             \u001b[1;34m'using'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mby\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    978\u001b[0m             'value': value})['value']\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mexecute\u001b[1;34m(self, driver_command, params)\u001b[0m\n\u001b[0;32m    319\u001b[0m         \u001b[0mresponse\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcommand_executor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexecute\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdriver_command\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mparams\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    320\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mresponse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 321\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0merror_handler\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcheck_response\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresponse\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    322\u001b[0m             response['value'] = self._unwrap_value(\n\u001b[0;32m    323\u001b[0m                 response.get('value', None))\n",
      "\u001b[1;32mC:\\ProgramData\\Anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\errorhandler.py\u001b[0m in \u001b[0;36mcheck_response\u001b[1;34m(self, response)\u001b[0m\n\u001b[0;32m    240\u001b[0m                 \u001b[0malert_text\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'alert'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'text'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    241\u001b[0m             \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0malert_text\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 242\u001b[1;33m         \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    243\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    244\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0m_value_or_default\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdefault\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNoSuchElementException\u001b[0m: Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//i[@class=\"icon icon-export\"]\"}\n  (Session info: chrome=91.0.4472.77)\n"
     ]
    }
   ],
   "source": [
    "# Export the .txt file by clicking the export icon.\n",
    "# find_element('xpath', ...) replaces find_element_by_xpath (removed in Selenium 4.3).\n",
    "# NOTE(review): the saved run of this cell raised NoSuchElementException — confirm that the\n",
    "# driver is on the window that contains the export icon before clicking.\n",
    "element = driver.find_element('xpath', '//i[@class=\"icon icon-export\"]')\n",
    "element.click()\n",
    "# Next: switch windows to the batch-export page."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 336,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 341,
   "metadata": {},
   "outputs": [
    {
     "ename": "SyntaxError",
     "evalue": "EOL while scanning string literal (<ipython-input-341-d2d6b5e6c9cb>, line 2)",
     "output_type": "error",
     "traceback": [
      "\u001b[1;36m  File \u001b[1;32m\"<ipython-input-341-d2d6b5e6c9cb>\"\u001b[1;36m, line \u001b[1;32m2\u001b[0m\n\u001b[1;33m    query = 'SU = \"计算机\" AND  (TI =\"人工智能\" OR  TI =\"大数据\"  OR TI = \"AI\" OR TI = \"big data\")\u001b[0m\n\u001b[1;37m                                                                                        ^\u001b[0m\n\u001b[1;31mSyntaxError\u001b[0m\u001b[1;31m:\u001b[0m EOL while scanning string literal\n"
     ]
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 339,
   "metadata": {},
   "outputs": [],
   "source": [
    " "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 340,
   "metadata": {},
   "outputs": [],
   "source": [
    " "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 模拟翻页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 点击下一页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the next-page button.\n",
    "# find_element('id', ...) replaces find_element_by_id (removed in Selenium 4.3); the former\n",
    "# get_attribute('innerHTML') call was dropped because its result was discarded.\n",
    "element = driver.find_element('id', 'PageNext')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 第一页开始"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the element with id 'page1'.\n",
    "# find_element('id', ...) replaces find_element_by_id (removed in Selenium 4.3); the former\n",
    "# get_attribute('innerHTML') call was dropped because its result was discarded.\n",
    "element = driver.find_element('id', 'page1')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 翻页页数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[0, 1, 2, 3, 4]\n"
     ]
    }
   ],
   "source": [
    "pages = list(range(0,5))\n",
    "print(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 翻页函数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {},
   "outputs": [],
   "source": [
    " 表格_html=dict()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [],
   "source": [
    "def fanye_pages(pages):\n",
    "    \"\"\"Click 'next page' once per entry in `pages` and store each table's HTML.\n",
    "\n",
    "    After every click the function waits 10 seconds, then saves the innerHTML of the\n",
    "    element with id 'gridTable' into the dict `表格_html` under key `p`. Because the\n",
    "    click happens first, the page shown before the first click is not stored.\n",
    "\n",
    "    Args:\n",
    "        pages: iterable of keys, one per click of the next-page button.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        # Click the next-page button.\n",
    "        # find_element('id', ...) replaces find_element_by_id (removed in Selenium 4.3).\n",
    "        next_button = driver.find_element('id', 'PageNext')\n",
    "        next_button.click()\n",
    "        # Pause to lower the chance of the crawler being banned or shown a captcha.\n",
    "        time.sleep(10)\n",
    "        # Grab the table that holds the page's main data.\n",
    "        element = driver.find_element('id', 'gridTable')\n",
    "        main_content = element.get_attribute('innerHTML')\n",
    "        表格_html[p] = main_content"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\t1\t2\t3\t4\t"
     ]
    }
   ],
   "source": [
    "# Turn one page per key in `pages`, filling 表格_html as a side effect.\n",
    "fanye_pages(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 数据表格化"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>大数据时代下计算机科学与技术专业综合改革</td>\n",
       "      <td>李洁</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>大数据背景下的计算机专业教学改革探讨</td>\n",
       "      <td>刘英</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>大数据时代计算机网络的安全问题及防范措施</td>\n",
       "      <td>赵培植</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>153.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>大数据时代计算机网络安全问题及对策分析</td>\n",
       "      <td>王研</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>68.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>大数据技术在计算机网络数据库建设中的运用</td>\n",
       "      <td>李少敏; 陈升晖</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-04-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>296</td>\n",
       "      <td>大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李斯</td>\n",
       "      <td>信息与电脑(理论版)</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>1.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>297</td>\n",
       "      <td>计算机图像识别技术“AI+安防”助力服务实战应用研究</td>\n",
       "      <td>姜威</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>169.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>298</td>\n",
       "      <td>地理信息系统软件在物流地理教学中的应用研究</td>\n",
       "      <td>蔡丽玲; 缪桂根</td>\n",
       "      <td>物流科技</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>68.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>299</td>\n",
       "      <td>大数据背景下的计算机网络信息安全分析</td>\n",
       "      <td>刘慧慧</td>\n",
       "      <td>科技创新与生产力</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>3.0</td>\n",
       "      <td>85.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>300</td>\n",
       "      <td>基于大数据的并行化深度卷积神经网络优化算法</td>\n",
       "      <td>毛伊敏; 张瑞朋; 曹文梁</td>\n",
       "      <td>计算机应用研究</td>\n",
       "      <td>2020-11-09 16:57</td>\n",
       "      <td>NaN</td>\n",
       "      <td>207.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>250 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                          篇名             作者          刊名  \\\n",
       "0           51        大数据时代下计算机科学与技术专业综合改革             李洁      无线互联科技   \n",
       "1           52          大数据背景下的计算机专业教学改革探讨             刘英      无线互联科技   \n",
       "2           53        大数据时代计算机网络的安全问题及防范措施            赵培植     数字技术与应用   \n",
       "3           54         大数据时代计算机网络安全问题及对策分析             王研      无线互联科技   \n",
       "4           55        大数据技术在计算机网络数据库建设中的运用       李少敏; 陈升晖      无线互联科技   \n",
       "..         ...                         ...            ...         ...   \n",
       "45         296       大数据时代人工智能在计算机网络技术中的应用             李斯  信息与电脑(理论版)   \n",
       "46         297  计算机图像识别技术“AI+安防”助力服务实战应用研究             姜威   网络安全技术与应用   \n",
       "47         298       地理信息系统软件在物流地理教学中的应用研究       蔡丽玲; 缪桂根        物流科技   \n",
       "48         299          大数据背景下的计算机网络信息安全分析            刘慧慧    科技创新与生产力   \n",
       "49         300       基于大数据的并行化深度卷积神经网络优化算法  毛伊敏; 张瑞朋; 曹文梁     计算机应用研究   \n",
       "\n",
       "                发表时间   被引     下载  操作  \n",
       "0         2021-04-25  NaN   33.0  下载  \n",
       "1         2021-04-25  NaN   20.0  下载  \n",
       "2         2021-04-25  NaN  153.0  下载  \n",
       "3         2021-04-25  NaN   68.0  下载  \n",
       "4         2021-04-25  NaN   20.0  下载  \n",
       "..               ...  ...    ...  ..  \n",
       "45        2020-11-10  1.0   32.0  下载  \n",
       "46        2020-11-10  NaN  169.0  下载  \n",
       "47        2020-11-10  NaN   68.0  下载  \n",
       "48        2020-11-10  3.0   85.0  下载  \n",
       "49  2020-11-09 16:57  NaN  207.0  下载  \n",
       "\n",
       "[250 rows x 8 columns]"
      ]
     },
     "execution_count": 101,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from io import StringIO  # local import: only this cell needs it\n",
    "\n",
    "# Parse the stored HTML of every scraped page into a DataFrame.\n",
    "# The markup is wrapped in StringIO because newer pandas releases deprecate\n",
    "# passing a literal HTML string to read_html.\n",
    "各页表格 = []\n",
    "for p in pages:\n",
    "    表格 = pd.read_html(StringIO(表格_html[p]))[0]\n",
    "    各页表格.append(表格)\n",
    "# Stack the per-page tables under a name that only ever holds a DataFrame;\n",
    "# each page keeps its own row index.\n",
    "df_收集 = pd.concat(各页表格)\n",
    "df_收集"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {},
   "outputs": [],
   "source": [
    "## 导出页面表格"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 103,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>基于计算机的大数据和云计算技术探析</td>\n",
       "      <td>马珺杰</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>大数据背景下的人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>王婧; 张学娜</td>\n",
       "      <td>中小企业管理与科技(中旬刊)</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>大数据时代计算机网络安全防范分析</td>\n",
       "      <td>楚丙奇</td>\n",
       "      <td>办公自动化</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究</td>\n",
       "      <td>赵于卓; 黄子莹</td>\n",
       "      <td>中国商论</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>GIS专业自然地理学野外实习的教学改革实践</td>\n",
       "      <td>吴小芳; 钟晓兰; 谢刚生; 何正勇</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>295</th>\n",
       "      <td>45</td>\n",
       "      <td>296</td>\n",
       "      <td>大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李斯</td>\n",
       "      <td>信息与电脑(理论版)</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>1.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>296</th>\n",
       "      <td>46</td>\n",
       "      <td>297</td>\n",
       "      <td>计算机图像识别技术“AI+安防”助力服务实战应用研究</td>\n",
       "      <td>姜威</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>169.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>297</th>\n",
       "      <td>47</td>\n",
       "      <td>298</td>\n",
       "      <td>地理信息系统软件在物流地理教学中的应用研究</td>\n",
       "      <td>蔡丽玲; 缪桂根</td>\n",
       "      <td>物流科技</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>68.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>298</th>\n",
       "      <td>48</td>\n",
       "      <td>299</td>\n",
       "      <td>大数据背景下的计算机网络信息安全分析</td>\n",
       "      <td>刘慧慧</td>\n",
       "      <td>科技创新与生产力</td>\n",
       "      <td>2020-11-10</td>\n",
       "      <td>3.0</td>\n",
       "      <td>85.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>299</th>\n",
       "      <td>49</td>\n",
       "      <td>300</td>\n",
       "      <td>基于大数据的并行化深度卷积神经网络优化算法</td>\n",
       "      <td>毛伊敏; 张瑞朋; 曹文梁</td>\n",
       "      <td>计算机应用研究</td>\n",
       "      <td>2020-11-09 16:57</td>\n",
       "      <td>NaN</td>\n",
       "      <td>207.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>300 rows × 9 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                            篇名                  作者  \\\n",
       "0        0           1             基于计算机的大数据和云计算技术探析                 马珺杰   \n",
       "1        1           2     大数据背景下的人工智能在计算机网络技术中的应用研究             王婧; 张学娜   \n",
       "2        2           3              大数据时代计算机网络安全防范分析                 楚丙奇   \n",
       "3        3           4  基于舞弊三角理论的GA-BP舞弊智能识别与大数据应用研究            赵于卓; 黄子莹   \n",
       "4        4           5         GIS专业自然地理学野外实习的教学改革实践  吴小芳; 钟晓兰; 谢刚生; 何正勇   \n",
       "..     ...         ...                           ...                 ...   \n",
       "295     45         296         大数据时代人工智能在计算机网络技术中的应用                  李斯   \n",
       "296     46         297    计算机图像识别技术“AI+安防”助力服务实战应用研究                  姜威   \n",
       "297     47         298         地理信息系统软件在物流地理教学中的应用研究            蔡丽玲; 缪桂根   \n",
       "298     48         299            大数据背景下的计算机网络信息安全分析                 刘慧慧   \n",
       "299     49         300         基于大数据的并行化深度卷积神经网络优化算法       毛伊敏; 张瑞朋; 曹文梁   \n",
       "\n",
       "                 刊名              发表时间   被引     下载  操作  \n",
       "0    中小企业管理与科技(中旬刊)        2021-07-02  NaN    NaN  下载  \n",
       "1    中小企业管理与科技(中旬刊)        2021-07-02  NaN    NaN  下载  \n",
       "2             办公自动化        2021-07-01  NaN    NaN  下载  \n",
       "3              中国商论        2021-06-30  NaN    NaN  下载  \n",
       "4              测绘通报        2021-06-25  NaN   49.0  下载  \n",
       "..              ...               ...  ...    ...  ..  \n",
       "295      信息与电脑(理论版)        2020-11-10  1.0   32.0  下载  \n",
       "296       网络安全技术与应用        2020-11-10  NaN  169.0  下载  \n",
       "297            物流科技        2020-11-10  NaN   68.0  下载  \n",
       "298        科技创新与生产力        2020-11-10  3.0   85.0  下载  \n",
       "299         计算机应用研究  2020-11-09 16:57  NaN  207.0  下载  \n",
       "\n",
       "[300 rows x 9 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Put the first page's table in front of the later pages. pd.concat replaces\n",
    "# DataFrame.append, which pandas 2.0 removed; reset_index() is kept so the\n",
    "# previous per-page row numbers still appear as an 'index' column.\n",
    "df_总表格 = pd.concat([df_第一页页面表格, df_收集]).reset_index()\n",
    "display(df_总表格)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Save the combined table locally as an Excel file.\n",
    "# NOTE(review): the sheet is named \"250篇\" while the stored output of the previous cell shows 300 rows - confirm the intended name.\n",
    "df_总表格.to_excel('知网文章页面数据.xlsx',sheet_name=\"250篇\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
